***************
** Arguments **
***************
backbone: 
config_file: configs/trainers/ProDA/vit_b16_ep50_c4_BZ4_ProDA.yaml
dataset_config_file: configs/datasets/imagenet.yaml
eval_only: False
head: 
load_epoch: None
model_dir: 
no_train: False
opts: ['DATASET.NUM_SHOTS', '16', 'DATASET.SUBSAMPLE_CLASSES', 'base']
output_dir: output/base2new/train_base/imagenet/vit_b16_ep50_c4_BZ4_ProDA/seed1
resume: 
root: /mnt/hdd/DATA
seed: 1
source_domains: None
target_domains: None
trainer: ProDA
transforms: None
************
** Config **
************
DATALOADER:
  K_TRANSFORMS: 1
  NUM_WORKERS: 8
  RETURN_IMG0: False
  TEST:
    BATCH_SIZE: 100
    SAMPLER: SequentialSampler
  TRAIN_U:
    BATCH_SIZE: 32
    N_DOMAIN: 0
    N_INS: 16
    SAME_AS_X: True
    SAMPLER: RandomSampler
  TRAIN_X:
    BATCH_SIZE: 4
    N_DOMAIN: 0
    N_INS: 16
    SAMPLER: RandomSampler
DATASET:
  ALL_AS_UNLABELED: False
  CIFAR_C_LEVEL: 1
  CIFAR_C_TYPE: 
  NAME: ImageNet
  NUM_LABELED: -1
  NUM_SHOTS: 16
  ROOT: /mnt/hdd/DATA
  SOURCE_DOMAINS: ()
  STL10_FOLD: -1
  SUBSAMPLE_CLASSES: base
  TARGET_DOMAINS: ()
  VAL_PERCENT: 0.1
INPUT:
  COLORJITTER_B: 0.4
  COLORJITTER_C: 0.4
  COLORJITTER_H: 0.1
  COLORJITTER_S: 0.4
  CROP_PADDING: 4
  CUTOUT_LEN: 16
  CUTOUT_N: 1
  GB_K: 21
  GB_P: 0.5
  GN_MEAN: 0.0
  GN_STD: 0.15
  INTERPOLATION: bicubic
  NO_TRANSFORM: False
  PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
  PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
  RANDAUGMENT_M: 10
  RANDAUGMENT_N: 2
  RGS_P: 0.2
  RRCROP_SCALE: (0.08, 1.0)
  SIZE: (224, 224)
  TRANSFORMS: ('random_resized_crop', 'random_flip', 'normalize')
MODEL:
  BACKBONE:
    NAME: ViT-B/16
    PRETRAINED: True
  HEAD:
    ACTIVATION: relu
    BN: True
    DROPOUT: 0.0
    HIDDEN_LAYERS: ()
    NAME: 
  INIT_WEIGHTS: 
OPTIM:
  ADAM_BETA1: 0.9
  ADAM_BETA2: 0.999
  BASE_LR_MULT: 0.1
  GAMMA: 0.1
  LR: 0.002
  LR_SCHEDULER: cosine
  MAX_EPOCH: 50
  MOMENTUM: 0.9
  NAME: sgd
  NEW_LAYERS: ()
  RMSPROP_ALPHA: 0.99
  SGD_DAMPNING: 0
  SGD_NESTEROV: False
  STAGED_LR: False
  STEPSIZE: (-1,)
  WARMUP_CONS_LR: 1e-05
  WARMUP_EPOCH: 5
  WARMUP_MIN_LR: 1e-05
  WARMUP_RECOUNT: True
  WARMUP_TYPE: constant
  WEIGHT_DECAY: 0.0005
OUTPUT_DIR: output/base2new/train_base/imagenet/vit_b16_ep50_c4_BZ4_ProDA/seed1
RESUME: 
SEED: 1
TEST:
  COMPUTE_CMAT: False
  EVALUATOR: Classification
  FINAL_MODEL: last_step
  NO_TEST: False
  PER_CLASS_RESULT: False
  SPLIT: test
TRAIN:
  CHECKPOINT_FREQ: 0
  COUNT_ITER: train_x
  PRINT_FREQ: 20
TRAINER:
  CDAC:
    CLASS_LR_MULTI: 10
    P_THRESH: 0.95
    RAMPUP_COEF: 30
    RAMPUP_ITRS: 1000
    STRONG_TRANSFORMS: ()
    TOPK_MATCH: 5
  COCOOP:
    CTX_INIT: 
    N_CTX: 16
    PREC: fp16
  COOP:
    CLASS_TOKEN_POSITION: end
    CSC: False
    CTX_INIT: 
    N_CTX: 16
    PREC: fp16
  CROSSGRAD:
    ALPHA_D: 0.5
    ALPHA_F: 0.5
    EPS_D: 1.0
    EPS_F: 1.0
  DAEL:
    CONF_THRE: 0.95
    STRONG_TRANSFORMS: ()
    WEIGHT_U: 0.5
  DAELDG:
    CONF_THRE: 0.95
    STRONG_TRANSFORMS: ()
    WEIGHT_U: 0.5
  DDAIG:
    ALPHA: 0.5
    CLAMP: False
    CLAMP_MAX: 1.0
    CLAMP_MIN: -1.0
    G_ARCH: 
    LMDA: 0.3
    WARMUP: 0
  DOMAINMIX:
    ALPHA: 1.0
    BETA: 1.0
    TYPE: crossdomain
  ENTMIN:
    LMDA: 0.001
  FIXMATCH:
    CONF_THRE: 0.95
    STRONG_TRANSFORMS: ()
    WEIGHT_U: 1.0
  IVLP:
    CTX_INIT: a photo of a
    N_CTX_TEXT: 2
    N_CTX_VISION: 2
    PREC: fp16
    PROMPT_DEPTH_TEXT: 9
    PROMPT_DEPTH_VISION: 9
  M3SDA:
    LMDA: 0.5
    N_STEP_F: 4
  MAPLE:
    CTX_INIT: a photo of a
    N_CTX: 4
    PREC: fp16
    PROMPT_DEPTH: 9
  MCD:
    N_STEP_F: 4
  MEANTEACHER:
    EMA_ALPHA: 0.999
    RAMPUP: 5
    WEIGHT_U: 1.0
  MIXMATCH:
    MIXUP_BETA: 0.75
    RAMPUP: 20000
    TEMP: 2.0
    WEIGHT_U: 100.0
  MME:
    LMDA: 0.1
  NAME: ProDA
  ProDA:
    N_CTX: 4
    N_PROMPT: 32
    PREC: fp16
  SE:
    CONF_THRE: 0.95
    EMA_ALPHA: 0.999
    RAMPUP: 300
  VPT:
    CTX_INIT: a photo of a
    N_CTX_VISION: 2
    PREC: fp16
    PROMPT_DEPTH_VISION: 1
USE_CUDA: True
VERBOSE: True
VERSION: 1
Collecting env info ...
** System info **
PyTorch version: 2.2.1+cu121
Is debug build: False
CUDA used to build PyTorch: 12.1
ROCM used to build PyTorch: N/A

OS: Debian GNU/Linux 12 (bookworm) (x86_64)
GCC version: (Debian 12.2.0-14) 12.2.0
Clang version: Could not collect
CMake version: Could not collect
Libc version: glibc-2.36

Python version: 3.11.2 (main, Mar 13 2023, 12:18:29) [GCC 12.2.0] (64-bit runtime)
Python platform: Linux-6.5.13-3-pve-x86_64-with-glibc2.36
Is CUDA available: True
CUDA runtime version: 11.8.89
CUDA_MODULE_LOADING set to: LAZY
GPU models and configuration: 
GPU 0: NVIDIA A800 80GB PCIe
GPU 1: NVIDIA A800 80GB PCIe

Nvidia driver version: 525.147.05
cuDNN version: Could not collect
HIP runtime version: N/A
MIOpen runtime version: N/A
Is XNNPACK available: True

CPU:
Architecture:                       x86_64
CPU op-mode(s):                     32-bit, 64-bit
Address sizes:                      46 bits physical, 57 bits virtual
Byte Order:                         Little Endian
CPU(s):                             64
On-line CPU(s) list:                18,20,22,23,25-27,29,31,32,34,37,46-49
Off-line CPU(s) list:               0-17,19,21,24,28,30,33,35,36,38-45,50-63
Vendor ID:                          GenuineIntel
Model name:                         Intel(R) Xeon(R) Gold 6326 CPU @ 2.90GHz
CPU family:                         6
Model:                              106
Thread(s) per core:                 2
Core(s) per socket:                 16
Socket(s):                          2
Stepping:                           6
CPU(s) scaling MHz:                 98%
CPU max MHz:                        3500.0000
CPU min MHz:                        800.0000
BogoMIPS:                           5800.00
Flags:                              fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush dts acpi mmx fxsr sse sse2 ss ht tm pbe syscall nx pdpe1gb rdtscp lm constant_tsc art arch_perfmon pebs bts rep_good nopl xtopology nonstop_tsc cpuid aperfmperf pni pclmulqdq dtes64 ds_cpl vmx smx est tm2 ssse3 sdbg fma cx16 xtpr pdcm pcid dca sse4_1 sse4_2 x2apic movbe popcnt tsc_deadline_timer aes xsave avx f16c rdrand lahf_lm abm 3dnowprefetch cpuid_fault epb cat_l3 invpcid_single intel_ppin ssbd mba ibrs ibpb stibp ibrs_enhanced tpr_shadow flexpriority ept vpid ept_ad fsgsbase tsc_adjust bmi1 avx2 smep bmi2 erms invpcid cqm rdt_a avx512f avx512dq rdseed adx smap avx512ifma clflushopt clwb intel_pt avx512cd sha_ni avx512bw avx512vl xsaveopt xsavec xgetbv1 xsaves cqm_llc cqm_occup_llc cqm_mbm_total cqm_mbm_local split_lock_detect wbnoinvd dtherm ida arat pln pts vnmi avx512vbmi umip pku ospke avx512_vbmi2 gfni vaes vpclmulqdq avx512_vnni avx512_bitalg tme avx512_vpopcntdq la57 rdpid fsrm md_clear pconfig flush_l1d arch_capabilities
Virtualization:                     VT-x
L1d cache:                          1.5 MiB (32 instances)
L1i cache:                          1 MiB (32 instances)
L2 cache:                           40 MiB (32 instances)
L3 cache:                           48 MiB (2 instances)
NUMA node(s):                       2
NUMA node0 CPU(s):                  0-15,32-47
NUMA node1 CPU(s):                  16-31,48-63
Vulnerability Gather data sampling: Vulnerable: No microcode
Vulnerability Itlb multihit:        Not affected
Vulnerability L1tf:                 Not affected
Vulnerability Mds:                  Not affected
Vulnerability Meltdown:             Not affected
Vulnerability Mmio stale data:      Mitigation; Clear CPU buffers; SMT vulnerable
Vulnerability Retbleed:             Not affected
Vulnerability Spec rstack overflow: Not affected
Vulnerability Spec store bypass:    Mitigation; Speculative Store Bypass disabled via prctl
Vulnerability Spectre v1:           Mitigation; usercopy/swapgs barriers and __user pointer sanitization
Vulnerability Spectre v2:           Mitigation; Enhanced / Automatic IBRS, IBPB conditional, RSB filling, PBRSB-eIBRS SW sequence
Vulnerability Srbds:                Not affected
Vulnerability Tsx async abort:      Not affected

Versions of relevant libraries:
[pip3] flake8==3.7.9
[pip3] flake8==3.7.9
[pip3] numpy==1.26.4
[pip3] torch==2.2.1
[pip3] torchaudio==2.2.1
[pip3] torchvision==0.17.1
[pip3] triton==2.2.0
[conda] Could not collect
        Pillow (10.2.0)

Loading trainer: ProDA
Loading dataset: ImageNet
Loading preprocessed few-shot data from /mnt/hdd/DATA/imagenet/split_fewshot/shot_16_shuffled-seed_1.pkl
SUBSAMPLE BASE CLASSES!
Building transform_train
+ random resized crop (size=(224, 224), scale=(0.08, 1.0))
+ random flip
+ to torch tensor of range [0, 1]
+ normalization (mean=[0.48145466, 0.4578275, 0.40821073], std=[0.26862954, 0.26130258, 0.27577711])
Building transform_test
+ resize the smaller edge to 224
+ 224x224 center crop
+ to torch tensor of range [0, 1]
+ normalization (mean=[0.48145466, 0.4578275, 0.40821073], std=[0.26862954, 0.26130258, 0.27577711])
---------  --------
Dataset    ImageNet
# classes  500
# train_x  8,000
# val      25,000
# test     25,000
---------  --------
Loading CLIP (backbone: ViT-B/16)
Building custom CLIP
Turning off gradients in both the image and the text encoder
Parameters to be updated: {'prompt_learner.ctx'}
Loading evaluator: Classification
No checkpoint found, train from scratch
Initialize tensorboard (log_dir=output/base2new/train_base/imagenet/vit_b16_ep50_c4_BZ4_ProDA/seed1/tensorboard)
epoch [1/50] batch [20/2000] time 2.013 (2.167) data 0.000 (0.029) loss 2.1227 (2.1939) lr 1.0000e-05 eta 2 days, 12:11:33
epoch [1/50] batch [40/2000] time 2.064 (2.102) data 0.000 (0.015) loss 0.3423 (2.0640) lr 1.0000e-05 eta 2 days, 10:21:12
epoch [1/50] batch [60/2000] time 2.019 (2.083) data 0.001 (0.010) loss 1.1633 (2.0956) lr 1.0000e-05 eta 2 days, 9:49:09
epoch [1/50] batch [80/2000] time 2.010 (2.073) data 0.000 (0.008) loss 0.3753 (2.0437) lr 1.0000e-05 eta 2 days, 9:31:43
epoch [1/50] batch [100/2000] time 2.064 (2.067) data 0.000 (0.006) loss 1.2695 (2.0316) lr 1.0000e-05 eta 2 days, 9:20:48
epoch [1/50] batch [120/2000] time 2.057 (2.061) data 0.000 (0.005) loss 1.6411 (2.0354) lr 1.0000e-05 eta 2 days, 9:11:35
epoch [1/50] batch [140/2000] time 2.001 (2.057) data 0.001 (0.004) loss 0.8574 (2.0169) lr 1.0000e-05 eta 2 days, 9:02:56
epoch [1/50] batch [160/2000] time 2.034 (2.055) data 0.000 (0.004) loss 2.1400 (2.0276) lr 1.0000e-05 eta 2 days, 8:58:52
epoch [1/50] batch [180/2000] time 2.003 (2.053) data 0.000 (0.003) loss 0.7903 (2.0475) lr 1.0000e-05 eta 2 days, 8:55:04
epoch [1/50] batch [200/2000] time 2.060 (2.051) data 0.000 (0.003) loss 2.0325 (2.0498) lr 1.0000e-05 eta 2 days, 8:51:48
epoch [1/50] batch [220/2000] time 2.010 (2.050) data 0.000 (0.003) loss 2.3585 (2.0713) lr 1.0000e-05 eta 2 days, 8:49:02
epoch [1/50] batch [240/2000] time 2.060 (2.049) data 0.000 (0.003) loss 1.8028 (2.0589) lr 1.0000e-05 eta 2 days, 8:46:52
epoch [1/50] batch [260/2000] time 1.987 (2.048) data 0.000 (0.002) loss 2.2631 (2.0468) lr 1.0000e-05 eta 2 days, 8:44:08
epoch [1/50] batch [280/2000] time 2.006 (2.047) data 0.000 (0.002) loss 3.2681 (2.0445) lr 1.0000e-05 eta 2 days, 8:42:51
epoch [1/50] batch [300/2000] time 2.059 (2.047) data 0.000 (0.002) loss 1.3165 (2.0141) lr 1.0000e-05 eta 2 days, 8:41:21
epoch [1/50] batch [320/2000] time 2.064 (2.047) data 0.000 (0.002) loss 2.1594 (2.0332) lr 1.0000e-05 eta 2 days, 8:40:11
epoch [1/50] batch [340/2000] time 2.057 (2.046) data 0.000 (0.002) loss 2.2711 (2.0458) lr 1.0000e-05 eta 2 days, 8:38:01
epoch [1/50] batch [360/2000] time 1.983 (2.045) data 0.000 (0.002) loss 1.8883 (2.0477) lr 1.0000e-05 eta 2 days, 8:36:18
epoch [1/50] batch [380/2000] time 2.039 (2.045) data 0.000 (0.002) loss 2.3203 (2.0514) lr 1.0000e-05 eta 2 days, 8:35:34
epoch [1/50] batch [400/2000] time 2.009 (2.045) data 0.000 (0.002) loss 1.2347 (2.0441) lr 1.0000e-05 eta 2 days, 8:34:04
epoch [1/50] batch [420/2000] time 2.015 (2.044) data 0.000 (0.002) loss 2.7100 (2.0454) lr 1.0000e-05 eta 2 days, 8:33:07
epoch [1/50] batch [440/2000] time 2.061 (2.044) data 0.000 (0.002) loss 2.5039 (2.0325) lr 1.0000e-05 eta 2 days, 8:32:00
epoch [1/50] batch [460/2000] time 2.031 (2.044) data 0.000 (0.001) loss 0.3548 (2.0432) lr 1.0000e-05 eta 2 days, 8:30:26
epoch [1/50] batch [480/2000] time 2.037 (2.044) data 0.000 (0.001) loss 2.9801 (2.0361) lr 1.0000e-05 eta 2 days, 8:29:57
epoch [1/50] batch [500/2000] time 2.063 (2.044) data 0.000 (0.001) loss 0.6564 (2.0362) lr 1.0000e-05 eta 2 days, 8:28:56
epoch [1/50] batch [520/2000] time 2.016 (2.043) data 0.000 (0.001) loss 0.3925 (2.0244) lr 1.0000e-05 eta 2 days, 8:28:00
epoch [1/50] batch [540/2000] time 2.063 (2.043) data 0.000 (0.001) loss 1.1857 (2.0121) lr 1.0000e-05 eta 2 days, 8:26:54
epoch [1/50] batch [560/2000] time 2.004 (2.043) data 0.000 (0.001) loss 3.4861 (2.0064) lr 1.0000e-05 eta 2 days, 8:25:56
epoch [1/50] batch [580/2000] time 2.037 (2.043) data 0.000 (0.001) loss 3.5704 (2.0129) lr 1.0000e-05 eta 2 days, 8:25:06
epoch [1/50] batch [600/2000] time 2.031 (2.043) data 0.001 (0.001) loss 3.5146 (2.0002) lr 1.0000e-05 eta 2 days, 8:24:07
epoch [1/50] batch [620/2000] time 2.048 (2.043) data 0.000 (0.001) loss 2.6626 (1.9863) lr 1.0000e-05 eta 2 days, 8:23:17
epoch [1/50] batch [640/2000] time 2.058 (2.042) data 0.000 (0.001) loss 3.0452 (1.9841) lr 1.0000e-05 eta 2 days, 8:22:01
epoch [1/50] batch [660/2000] time 2.047 (2.042) data 0.000 (0.001) loss 1.9926 (1.9685) lr 1.0000e-05 eta 2 days, 8:20:56
epoch [1/50] batch [680/2000] time 2.030 (2.042) data 0.000 (0.001) loss 3.4905 (1.9790) lr 1.0000e-05 eta 2 days, 8:20:15
epoch [1/50] batch [700/2000] time 2.005 (2.042) data 0.000 (0.001) loss 2.1690 (1.9722) lr 1.0000e-05 eta 2 days, 8:19:18
epoch [1/50] batch [720/2000] time 2.061 (2.042) data 0.000 (0.001) loss 2.3655 (1.9764) lr 1.0000e-05 eta 2 days, 8:18:30
epoch [1/50] batch [740/2000] time 2.010 (2.042) data 0.000 (0.001) loss 2.8979 (1.9846) lr 1.0000e-05 eta 2 days, 8:17:20
epoch [1/50] batch [760/2000] time 1.980 (2.041) data 0.000 (0.001) loss 2.5623 (1.9821) lr 1.0000e-05 eta 2 days, 8:16:18
epoch [1/50] batch [780/2000] time 2.006 (2.041) data 0.000 (0.001) loss 1.9579 (1.9835) lr 1.0000e-05 eta 2 days, 8:15:19
epoch [1/50] batch [800/2000] time 2.032 (2.041) data 0.000 (0.001) loss 0.1355 (1.9656) lr 1.0000e-05 eta 2 days, 8:14:23
epoch [1/50] batch [820/2000] time 2.054 (2.041) data 0.000 (0.001) loss 0.5252 (1.9594) lr 1.0000e-05 eta 2 days, 8:13:16
epoch [1/50] batch [840/2000] time 2.059 (2.041) data 0.000 (0.001) loss 0.7086 (1.9519) lr 1.0000e-05 eta 2 days, 8:12:23
epoch [1/50] batch [860/2000] time 2.006 (2.041) data 0.000 (0.001) loss 0.1603 (1.9537) lr 1.0000e-05 eta 2 days, 8:11:36
epoch [1/50] batch [880/2000] time 2.036 (2.041) data 0.000 (0.001) loss 0.7006 (1.9428) lr 1.0000e-05 eta 2 days, 8:10:59
epoch [1/50] batch [900/2000] time 2.065 (2.041) data 0.000 (0.001) loss 3.3179 (1.9432) lr 1.0000e-05 eta 2 days, 8:10:16
epoch [1/50] batch [920/2000] time 2.006 (2.041) data 0.000 (0.001) loss 2.3235 (1.9305) lr 1.0000e-05 eta 2 days, 8:09:41
epoch [1/50] batch [940/2000] time 2.061 (2.041) data 0.000 (0.001) loss 0.0345 (1.9199) lr 1.0000e-05 eta 2 days, 8:09:09
epoch [1/50] batch [960/2000] time 2.035 (2.041) data 0.000 (0.001) loss 2.7648 (1.9154) lr 1.0000e-05 eta 2 days, 8:08:29
epoch [1/50] batch [980/2000] time 2.015 (2.041) data 0.000 (0.001) loss 1.7825 (1.9154) lr 1.0000e-05 eta 2 days, 8:07:51
epoch [1/50] batch [1000/2000] time 2.066 (2.041) data 0.000 (0.001) loss 1.4213 (1.9110) lr 1.0000e-05 eta 2 days, 8:06:59
epoch [1/50] batch [1020/2000] time 2.012 (2.041) data 0.000 (0.001) loss 1.2812 (1.9101) lr 1.0000e-05 eta 2 days, 8:06:14
epoch [1/50] batch [1040/2000] time 2.008 (2.041) data 0.000 (0.001) loss 2.2342 (1.9057) lr 1.0000e-05 eta 2 days, 8:05:32
epoch [1/50] batch [1060/2000] time 2.065 (2.041) data 0.000 (0.001) loss 1.7151 (1.8958) lr 1.0000e-05 eta 2 days, 8:05:01
epoch [1/50] batch [1080/2000] time 2.017 (2.041) data 0.000 (0.001) loss 2.9229 (1.8866) lr 1.0000e-05 eta 2 days, 8:04:15
epoch [1/50] batch [1100/2000] time 1.987 (2.041) data 0.000 (0.001) loss 1.3362 (1.8829) lr 1.0000e-05 eta 2 days, 8:03:32
epoch [1/50] batch [1120/2000] time 2.062 (2.040) data 0.000 (0.001) loss 1.9548 (1.8739) lr 1.0000e-05 eta 2 days, 8:02:41
epoch [1/50] batch [1140/2000] time 2.006 (2.040) data 0.001 (0.001) loss 1.4270 (1.8709) lr 1.0000e-05 eta 2 days, 8:01:44
epoch [1/50] batch [1160/2000] time 2.063 (2.040) data 0.000 (0.001) loss 2.2954 (1.8677) lr 1.0000e-05 eta 2 days, 8:01:06
epoch [1/50] batch [1180/2000] time 2.038 (2.040) data 0.000 (0.001) loss 2.4941 (1.8732) lr 1.0000e-05 eta 2 days, 8:00:09
epoch [1/50] batch [1200/2000] time 2.008 (2.040) data 0.000 (0.001) loss 0.5365 (1.8690) lr 1.0000e-05 eta 2 days, 7:59:22
epoch [1/50] batch [1220/2000] time 2.050 (2.040) data 0.000 (0.001) loss 1.6643 (1.8631) lr 1.0000e-05 eta 2 days, 7:58:38
epoch [1/50] batch [1240/2000] time 2.065 (2.040) data 0.000 (0.001) loss 2.0308 (1.8584) lr 1.0000e-05 eta 2 days, 7:58:00
epoch [1/50] batch [1260/2000] time 2.034 (2.040) data 0.000 (0.001) loss 0.5015 (1.8522) lr 1.0000e-05 eta 2 days, 7:57:22
epoch [1/50] batch [1280/2000] time 2.058 (2.040) data 0.000 (0.001) loss 2.1927 (1.8485) lr 1.0000e-05 eta 2 days, 7:56:37
epoch [1/50] batch [1300/2000] time 2.054 (2.040) data 0.000 (0.001) loss 0.9532 (1.8444) lr 1.0000e-05 eta 2 days, 7:55:55
epoch [1/50] batch [1320/2000] time 2.000 (2.040) data 0.000 (0.001) loss 0.5231 (1.8405) lr 1.0000e-05 eta 2 days, 7:54:59
epoch [1/50] batch [1340/2000] time 2.002 (2.040) data 0.000 (0.001) loss 1.4172 (1.8401) lr 1.0000e-05 eta 2 days, 7:54:11
epoch [1/50] batch [1360/2000] time 2.059 (2.040) data 0.000 (0.001) loss 0.3751 (1.8368) lr 1.0000e-05 eta 2 days, 7:53:22
epoch [1/50] batch [1380/2000] time 2.006 (2.040) data 0.000 (0.001) loss 2.1277 (1.8365) lr 1.0000e-05 eta 2 days, 7:52:40
epoch [1/50] batch [1400/2000] time 1.981 (2.040) data 0.000 (0.001) loss 0.7444 (1.8376) lr 1.0000e-05 eta 2 days, 7:51:48
epoch [1/50] batch [1420/2000] time 1.984 (2.039) data 0.000 (0.001) loss 4.0419 (1.8365) lr 1.0000e-05 eta 2 days, 7:50:52
epoch [1/50] batch [1440/2000] time 2.005 (2.040) data 0.000 (0.001) loss 0.2964 (1.8270) lr 1.0000e-05 eta 2 days, 7:50:16
epoch [1/50] batch [1460/2000] time 2.031 (2.039) data 0.000 (0.001) loss 2.9348 (1.8259) lr 1.0000e-05 eta 2 days, 7:49:21
epoch [1/50] batch [1480/2000] time 2.034 (2.039) data 0.000 (0.001) loss 1.7391 (1.8255) lr 1.0000e-05 eta 2 days, 7:48:37
epoch [1/50] batch [1500/2000] time 2.056 (2.039) data 0.000 (0.001) loss 0.6031 (1.8233) lr 1.0000e-05 eta 2 days, 7:47:55
epoch [1/50] batch [1520/2000] time 2.057 (2.039) data 0.000 (0.001) loss 0.3969 (1.8194) lr 1.0000e-05 eta 2 days, 7:47:14
epoch [1/50] batch [1540/2000] time 2.031 (2.039) data 0.000 (0.001) loss 0.5719 (1.8233) lr 1.0000e-05 eta 2 days, 7:46:36
epoch [1/50] batch [1560/2000] time 2.006 (2.039) data 0.000 (0.001) loss 1.0881 (1.8185) lr 1.0000e-05 eta 2 days, 7:45:53
epoch [1/50] batch [1580/2000] time 2.034 (2.039) data 0.000 (0.001) loss 0.8203 (1.8099) lr 1.0000e-05 eta 2 days, 7:45:10
epoch [1/50] batch [1600/2000] time 2.010 (2.039) data 0.000 (0.001) loss 1.8754 (1.8111) lr 1.0000e-05 eta 2 days, 7:44:19
epoch [1/50] batch [1620/2000] time 2.060 (2.039) data 0.000 (0.001) loss 0.8924 (1.8097) lr 1.0000e-05 eta 2 days, 7:43:41
epoch [1/50] batch [1640/2000] time 2.034 (2.039) data 0.000 (0.001) loss 1.0319 (1.8094) lr 1.0000e-05 eta 2 days, 7:42:54
epoch [1/50] batch [1660/2000] time 2.057 (2.039) data 0.000 (0.001) loss 2.2022 (1.8054) lr 1.0000e-05 eta 2 days, 7:42:12
epoch [1/50] batch [1680/2000] time 2.055 (2.039) data 0.001 (0.001) loss 0.8197 (1.8059) lr 1.0000e-05 eta 2 days, 7:41:28
epoch [1/50] batch [1700/2000] time 2.037 (2.039) data 0.000 (0.001) loss 1.0196 (1.8061) lr 1.0000e-05 eta 2 days, 7:40:45
epoch [1/50] batch [1720/2000] time 2.059 (2.039) data 0.000 (0.001) loss 1.3648 (1.8028) lr 1.0000e-05 eta 2 days, 7:40:09
epoch [1/50] batch [1740/2000] time 2.034 (2.039) data 0.000 (0.001) loss 1.9857 (1.8035) lr 1.0000e-05 eta 2 days, 7:39:32
epoch [1/50] batch [1760/2000] time 2.005 (2.039) data 0.000 (0.001) loss 1.6327 (1.7988) lr 1.0000e-05 eta 2 days, 7:38:38
epoch [1/50] batch [1780/2000] time 2.058 (2.039) data 0.000 (0.001) loss 1.3433 (1.7973) lr 1.0000e-05 eta 2 days, 7:37:48
epoch [1/50] batch [1800/2000] time 2.077 (2.039) data 0.000 (0.001) loss 1.0258 (1.7940) lr 1.0000e-05 eta 2 days, 7:37:07
epoch [1/50] batch [1820/2000] time 2.054 (2.039) data 0.000 (0.001) loss 1.6055 (1.7883) lr 1.0000e-05 eta 2 days, 7:36:19
epoch [1/50] batch [1840/2000] time 2.004 (2.039) data 0.000 (0.001) loss 1.3506 (1.7886) lr 1.0000e-05 eta 2 days, 7:35:37
epoch [1/50] batch [1860/2000] time 2.057 (2.039) data 0.000 (0.001) loss 0.3159 (1.7858) lr 1.0000e-05 eta 2 days, 7:34:57
epoch [1/50] batch [1880/2000] time 2.031 (2.039) data 0.000 (0.001) loss 2.3190 (1.7832) lr 1.0000e-05 eta 2 days, 7:34:13
epoch [1/50] batch [1900/2000] time 2.005 (2.039) data 0.000 (0.001) loss 3.8007 (1.7845) lr 1.0000e-05 eta 2 days, 7:33:34
epoch [1/50] batch [1920/2000] time 2.003 (2.039) data 0.000 (0.001) loss 1.2579 (1.7833) lr 1.0000e-05 eta 2 days, 7:32:43
epoch [1/50] batch [1940/2000] time 2.055 (2.039) data 0.000 (0.001) loss 0.7836 (1.7810) lr 1.0000e-05 eta 2 days, 7:31:55
epoch [1/50] batch [1960/2000] time 2.056 (2.039) data 0.000 (0.001) loss 2.7877 (1.7777) lr 1.0000e-05 eta 2 days, 7:31:07
epoch [1/50] batch [1980/2000] time 2.004 (2.039) data 0.000 (0.001) loss 0.7787 (1.7756) lr 1.0000e-05 eta 2 days, 7:30:23
epoch [1/50] batch [2000/2000] time 2.004 (2.039) data 0.000 (0.001) loss 2.4670 (1.7755) lr 1.0000e-05 eta 2 days, 7:29:41
epoch [2/50] batch [20/2000] time 2.059 (2.066) data 0.000 (0.028) loss 0.4558 (1.5999) lr 1.0000e-05 eta 2 days, 8:13:33
epoch [2/50] batch [40/2000] time 1.980 (2.046) data 0.000 (0.014) loss 0.9792 (1.5228) lr 1.0000e-05 eta 2 days, 7:41:09
epoch [2/50] batch [60/2000] time 2.054 (2.043) data 0.001 (0.010) loss 2.3247 (1.5094) lr 1.0000e-05 eta 2 days, 7:34:45
epoch [2/50] batch [80/2000] time 2.055 (2.041) data 0.000 (0.007) loss 1.5002 (1.4525) lr 1.0000e-05 eta 2 days, 7:31:16
epoch [2/50] batch [100/2000] time 2.029 (2.040) data 0.000 (0.006) loss 2.5632 (1.5122) lr 1.0000e-05 eta 2 days, 7:28:03
epoch [2/50] batch [120/2000] time 2.003 (2.038) data 0.000 (0.005) loss 0.1417 (1.5158) lr 1.0000e-05 eta 2 days, 7:25:04
epoch [2/50] batch [140/2000] time 2.033 (2.037) data 0.000 (0.004) loss 0.4362 (1.5742) lr 1.0000e-05 eta 2 days, 7:22:51
epoch [2/50] batch [160/2000] time 2.036 (2.037) data 0.000 (0.004) loss 0.4053 (1.5534) lr 1.0000e-05 eta 2 days, 7:21:15
epoch [2/50] batch [180/2000] time 2.005 (2.037) data 0.000 (0.003) loss 0.2172 (1.5562) lr 1.0000e-05 eta 2 days, 7:20:25
epoch [2/50] batch [200/2000] time 2.068 (2.037) data 0.000 (0.003) loss 3.3465 (1.5823) lr 1.0000e-05 eta 2 days, 7:20:48
epoch [2/50] batch [220/2000] time 2.011 (2.037) data 0.000 (0.003) loss 2.0582 (1.5888) lr 1.0000e-05 eta 2 days, 7:20:06
epoch [2/50] batch [240/2000] time 2.053 (2.037) data 0.000 (0.003) loss 1.4129 (1.6117) lr 1.0000e-05 eta 2 days, 7:19:29
epoch [2/50] batch [260/2000] time 2.057 (2.037) data 0.000 (0.002) loss 1.9918 (1.6078) lr 1.0000e-05 eta 2 days, 7:18:18
epoch [2/50] batch [280/2000] time 2.057 (2.037) data 0.000 (0.002) loss 1.8995 (1.6072) lr 1.0000e-05 eta 2 days, 7:16:56
epoch [2/50] batch [300/2000] time 2.008 (2.036) data 0.000 (0.002) loss 1.9389 (1.6005) lr 1.0000e-05 eta 2 days, 7:16:05
epoch [2/50] batch [320/2000] time 2.053 (2.036) data 0.000 (0.002) loss 1.2979 (1.6038) lr 1.0000e-05 eta 2 days, 7:14:37
epoch [2/50] batch [340/2000] time 2.008 (2.036) data 0.000 (0.002) loss 1.9978 (1.5998) lr 1.0000e-05 eta 2 days, 7:13:08
epoch [2/50] batch [360/2000] time 2.033 (2.036) data 0.000 (0.002) loss 0.8279 (1.6090) lr 1.0000e-05 eta 2 days, 7:13:14
epoch [2/50] batch [380/2000] time 2.004 (2.036) data 0.000 (0.002) loss 1.1093 (1.6120) lr 1.0000e-05 eta 2 days, 7:12:52
epoch [2/50] batch [400/2000] time 2.059 (2.036) data 0.000 (0.002) loss 0.9304 (1.6236) lr 1.0000e-05 eta 2 days, 7:12:04
epoch [2/50] batch [420/2000] time 2.004 (2.036) data 0.000 (0.002) loss 1.6057 (1.6046) lr 1.0000e-05 eta 2 days, 7:11:55
epoch [2/50] batch [440/2000] time 2.032 (2.036) data 0.000 (0.002) loss 0.4564 (1.5958) lr 1.0000e-05 eta 2 days, 7:11:15
epoch [2/50] batch [460/2000] time 2.056 (2.036) data 0.000 (0.001) loss 0.6445 (1.5871) lr 1.0000e-05 eta 2 days, 7:10:20
epoch [2/50] batch [480/2000] time 2.029 (2.036) data 0.000 (0.001) loss 1.6355 (1.5866) lr 1.0000e-05 eta 2 days, 7:09:19
epoch [2/50] batch [500/2000] time 2.030 (2.036) data 0.000 (0.001) loss 2.5690 (1.5784) lr 1.0000e-05 eta 2 days, 7:08:21
epoch [2/50] batch [520/2000] time 2.000 (2.036) data 0.000 (0.001) loss 0.1451 (1.5744) lr 1.0000e-05 eta 2 days, 7:07:13
epoch [2/50] batch [540/2000] time 2.002 (2.036) data 0.000 (0.001) loss 1.1448 (1.5601) lr 1.0000e-05 eta 2 days, 7:06:24
epoch [2/50] batch [560/2000] time 2.053 (2.036) data 0.000 (0.001) loss 1.1663 (1.5668) lr 1.0000e-05 eta 2 days, 7:06:09
epoch [2/50] batch [580/2000] time 2.061 (2.036) data 0.000 (0.001) loss 2.1612 (1.5686) lr 1.0000e-05 eta 2 days, 7:05:42
epoch [2/50] batch [600/2000] time 2.066 (2.036) data 0.001 (0.001) loss 0.2934 (1.5695) lr 1.0000e-05 eta 2 days, 7:05:04
epoch [2/50] batch [620/2000] time 2.062 (2.036) data 0.000 (0.001) loss 0.5100 (1.5778) lr 1.0000e-05 eta 2 days, 7:04:48
epoch [2/50] batch [640/2000] time 2.062 (2.036) data 0.000 (0.001) loss 0.3744 (1.5700) lr 1.0000e-05 eta 2 days, 7:04:27
epoch [2/50] batch [660/2000] time 2.039 (2.036) data 0.000 (0.001) loss 1.3524 (1.5607) lr 1.0000e-05 eta 2 days, 7:03:24
epoch [2/50] batch [680/2000] time 2.062 (2.036) data 0.000 (0.001) loss 2.9789 (1.5656) lr 1.0000e-05 eta 2 days, 7:03:05
epoch [2/50] batch [700/2000] time 2.036 (2.036) data 0.000 (0.001) loss 1.8384 (1.5671) lr 1.0000e-05 eta 2 days, 7:02:25
epoch [2/50] batch [720/2000] time 2.057 (2.036) data 0.000 (0.001) loss 1.3096 (1.5627) lr 1.0000e-05 eta 2 days, 7:01:21
epoch [2/50] batch [740/2000] time 2.005 (2.036) data 0.000 (0.001) loss 2.5043 (1.5636) lr 1.0000e-05 eta 2 days, 7:00:38
epoch [2/50] batch [760/2000] time 2.054 (2.036) data 0.000 (0.001) loss 3.8435 (1.5673) lr 1.0000e-05 eta 2 days, 7:00:03
epoch [2/50] batch [780/2000] time 2.057 (2.036) data 0.000 (0.001) loss 1.0619 (1.5628) lr 1.0000e-05 eta 2 days, 6:59:15
epoch [2/50] batch [800/2000] time 2.035 (2.036) data 0.000 (0.001) loss 1.1077 (1.5544) lr 1.0000e-05 eta 2 days, 6:58:42
epoch [2/50] batch [820/2000] time 2.061 (2.036) data 0.002 (0.001) loss 1.3668 (1.5605) lr 1.0000e-05 eta 2 days, 6:57:47
epoch [2/50] batch [840/2000] time 2.058 (2.036) data 0.000 (0.001) loss 1.8640 (1.5668) lr 1.0000e-05 eta 2 days, 6:57:10
epoch [2/50] batch [860/2000] time 2.057 (2.036) data 0.000 (0.001) loss 1.5451 (1.5677) lr 1.0000e-05 eta 2 days, 6:56:36
epoch [2/50] batch [880/2000] time 2.060 (2.036) data 0.000 (0.001) loss 1.4016 (1.5678) lr 1.0000e-05 eta 2 days, 6:55:54
epoch [2/50] batch [900/2000] time 2.005 (2.036) data 0.000 (0.001) loss 0.5163 (1.5712) lr 1.0000e-05 eta 2 days, 6:55:20
epoch [2/50] batch [920/2000] time 2.039 (2.036) data 0.000 (0.001) loss 2.1725 (1.5704) lr 1.0000e-05 eta 2 days, 6:54:35
epoch [2/50] batch [940/2000] time 2.058 (2.036) data 0.000 (0.001) loss 2.4824 (1.5749) lr 1.0000e-05 eta 2 days, 6:53:57
epoch [2/50] batch [960/2000] time 2.035 (2.036) data 0.000 (0.001) loss 2.3986 (1.5769) lr 1.0000e-05 eta 2 days, 6:53:10
epoch [2/50] batch [980/2000] time 2.033 (2.036) data 0.000 (0.001) loss 2.2189 (1.5772) lr 1.0000e-05 eta 2 days, 6:52:25
epoch [2/50] batch [1000/2000] time 2.010 (2.036) data 0.000 (0.001) loss 0.9224 (1.5821) lr 1.0000e-05 eta 2 days, 6:51:53
epoch [2/50] batch [1020/2000] time 2.005 (2.036) data 0.000 (0.001) loss 2.3782 (1.5767) lr 1.0000e-05 eta 2 days, 6:51:06
epoch [2/50] batch [1040/2000] time 2.037 (2.036) data 0.000 (0.001) loss 3.4778 (1.5709) lr 1.0000e-05 eta 2 days, 6:50:32
epoch [2/50] batch [1060/2000] time 2.033 (2.036) data 0.000 (0.001) loss 1.1114 (1.5747) lr 1.0000e-05 eta 2 days, 6:49:56
epoch [2/50] batch [1080/2000] time 2.004 (2.036) data 0.000 (0.001) loss 2.0009 (1.5807) lr 1.0000e-05 eta 2 days, 6:49:15
epoch [2/50] batch [1100/2000] time 2.036 (2.036) data 0.000 (0.001) loss 1.8239 (1.5764) lr 1.0000e-05 eta 2 days, 6:48:17
epoch [2/50] batch [1120/2000] time 2.056 (2.036) data 0.000 (0.001) loss 1.6344 (1.5731) lr 1.0000e-05 eta 2 days, 6:47:20
epoch [2/50] batch [1140/2000] time 2.057 (2.036) data 0.001 (0.001) loss 2.8712 (1.5782) lr 1.0000e-05 eta 2 days, 6:46:33
epoch [2/50] batch [1160/2000] time 1.982 (2.036) data 0.000 (0.001) loss 1.1816 (1.5761) lr 1.0000e-05 eta 2 days, 6:45:53
epoch [2/50] batch [1180/2000] time 2.033 (2.036) data 0.000 (0.001) loss 1.0349 (1.5789) lr 1.0000e-05 eta 2 days, 6:45:13
epoch [2/50] batch [1200/2000] time 2.004 (2.036) data 0.000 (0.001) loss 0.8449 (1.5800) lr 1.0000e-05 eta 2 days, 6:44:27
epoch [2/50] batch [1220/2000] time 2.032 (2.036) data 0.000 (0.001) loss 2.3650 (1.5830) lr 1.0000e-05 eta 2 days, 6:43:43
epoch [2/50] batch [1240/2000] time 2.004 (2.036) data 0.000 (0.001) loss 1.4022 (1.5823) lr 1.0000e-05 eta 2 days, 6:43:08
epoch [2/50] batch [1260/2000] time 2.056 (2.036) data 0.000 (0.001) loss 0.5791 (1.5794) lr 1.0000e-05 eta 2 days, 6:42:34
epoch [2/50] batch [1280/2000] time 2.038 (2.036) data 0.000 (0.001) loss 1.2124 (1.5784) lr 1.0000e-05 eta 2 days, 6:41:56
epoch [2/50] batch [1300/2000] time 2.032 (2.036) data 0.000 (0.001) loss 2.0180 (1.5717) lr 1.0000e-05 eta 2 days, 6:41:25
epoch [2/50] batch [1320/2000] time 2.059 (2.036) data 0.000 (0.001) loss 1.5406 (1.5727) lr 1.0000e-05 eta 2 days, 6:40:46
epoch [2/50] batch [1340/2000] time 1.987 (2.036) data 0.000 (0.001) loss 0.6122 (1.5724) lr 1.0000e-05 eta 2 days, 6:39:58
epoch [2/50] batch [1360/2000] time 2.059 (2.036) data 0.000 (0.001) loss 5.0952 (1.5773) lr 1.0000e-05 eta 2 days, 6:39:10
epoch [2/50] batch [1380/2000] time 2.059 (2.036) data 0.000 (0.001) loss 0.5091 (1.5770) lr 1.0000e-05 eta 2 days, 6:38:24
epoch [2/50] batch [1400/2000] time 2.014 (2.036) data 0.000 (0.001) loss 0.6973 (1.5736) lr 1.0000e-05 eta 2 days, 6:37:43
epoch [2/50] batch [1420/2000] time 2.003 (2.036) data 0.000 (0.001) loss 3.0998 (1.5744) lr 1.0000e-05 eta 2 days, 6:36:52
epoch [2/50] batch [1440/2000] time 2.040 (2.036) data 0.000 (0.001) loss 2.7386 (1.5714) lr 1.0000e-05 eta 2 days, 6:36:10
epoch [2/50] batch [1460/2000] time 2.009 (2.036) data 0.000 (0.001) loss 1.9325 (1.5711) lr 1.0000e-05 eta 2 days, 6:35:33
epoch [2/50] batch [1480/2000] time 2.058 (2.036) data 0.000 (0.001) loss 2.0474 (1.5667) lr 1.0000e-05 eta 2 days, 6:35:04
epoch [2/50] batch [1500/2000] time 2.005 (2.036) data 0.000 (0.001) loss 0.8334 (1.5648) lr 1.0000e-05 eta 2 days, 6:34:19
epoch [2/50] batch [1520/2000] time 2.007 (2.036) data 0.000 (0.001) loss 1.6876 (1.5655) lr 1.0000e-05 eta 2 days, 6:33:30
epoch [2/50] batch [1540/2000] time 2.004 (2.036) data 0.000 (0.001) loss 1.0063 (1.5657) lr 1.0000e-05 eta 2 days, 6:32:47
epoch [2/50] batch [1560/2000] time 1.982 (2.036) data 0.000 (0.001) loss 0.1595 (1.5669) lr 1.0000e-05 eta 2 days, 6:32:05
epoch [2/50] batch [1580/2000] time 2.029 (2.036) data 0.000 (0.001) loss 1.3538 (1.5625) lr 1.0000e-05 eta 2 days, 6:31:19
epoch [2/50] batch [1600/2000] time 2.033 (2.036) data 0.000 (0.001) loss 0.5593 (1.5609) lr 1.0000e-05 eta 2 days, 6:30:25
epoch [2/50] batch [1620/2000] time 1.996 (2.035) data 0.000 (0.001) loss 2.5817 (1.5637) lr 1.0000e-05 eta 2 days, 6:29:33
epoch [2/50] batch [1640/2000] time 2.032 (2.035) data 0.000 (0.001) loss 1.3246 (1.5666) lr 1.0000e-05 eta 2 days, 6:28:51
epoch [2/50] batch [1660/2000] time 2.005 (2.035) data 0.000 (0.001) loss 1.3452 (1.5680) lr 1.0000e-05 eta 2 days, 6:28:09
epoch [2/50] batch [1680/2000] time 1.984 (2.035) data 0.001 (0.001) loss 1.3759 (1.5686) lr 1.0000e-05 eta 2 days, 6:27:33
epoch [2/50] batch [1700/2000] time 2.059 (2.036) data 0.000 (0.001) loss 1.4901 (1.5657) lr 1.0000e-05 eta 2 days, 6:27:05
epoch [2/50] batch [1720/2000] time 2.007 (2.036) data 0.000 (0.001) loss 0.8758 (1.5642) lr 1.0000e-05 eta 2 days, 6:26:24
epoch [2/50] batch [1740/2000] time 2.036 (2.036) data 0.000 (0.001) loss 0.9876 (1.5677) lr 1.0000e-05 eta 2 days, 6:25:50
epoch [2/50] batch [1760/2000] time 2.066 (2.036) data 0.000 (0.001) loss 2.8792 (1.5639) lr 1.0000e-05 eta 2 days, 6:25:09
epoch [2/50] batch [1780/2000] time 2.058 (2.036) data 0.000 (0.001) loss 0.2783 (1.5632) lr 1.0000e-05 eta 2 days, 6:24:31
epoch [2/50] batch [1800/2000] time 2.057 (2.036) data 0.000 (0.001) loss 0.2185 (1.5614) lr 1.0000e-05 eta 2 days, 6:23:48
epoch [2/50] batch [1820/2000] time 2.010 (2.036) data 0.000 (0.001) loss 1.7895 (1.5600) lr 1.0000e-05 eta 2 days, 6:23:05
epoch [2/50] batch [1840/2000] time 2.035 (2.036) data 0.000 (0.001) loss 2.0554 (1.5586) lr 1.0000e-05 eta 2 days, 6:22:27
epoch [2/50] batch [1860/2000] time 2.035 (2.036) data 0.000 (0.001) loss 0.9085 (1.5558) lr 1.0000e-05 eta 2 days, 6:21:45
epoch [2/50] batch [1880/2000] time 2.062 (2.036) data 0.000 (0.001) loss 4.0501 (1.5549) lr 1.0000e-05 eta 2 days, 6:21:07
epoch [2/50] batch [1900/2000] time 2.055 (2.036) data 0.000 (0.001) loss 0.7141 (1.5510) lr 1.0000e-05 eta 2 days, 6:20:28
epoch [2/50] batch [1920/2000] time 2.057 (2.036) data 0.000 (0.001) loss 1.1612 (1.5511) lr 1.0000e-05 eta 2 days, 6:19:50
epoch [2/50] batch [1940/2000] time 2.037 (2.036) data 0.000 (0.001) loss 0.5333 (1.5482) lr 1.0000e-05 eta 2 days, 6:19:09
epoch [2/50] batch [1960/2000] time 2.056 (2.036) data 0.000 (0.001) loss 0.3130 (1.5477) lr 1.0000e-05 eta 2 days, 6:18:32
epoch [2/50] batch [1980/2000] time 2.005 (2.036) data 0.000 (0.001) loss 2.9548 (1.5472) lr 1.0000e-05 eta 2 days, 6:17:55
epoch [2/50] batch [2000/2000] time 2.060 (2.036) data 0.000 (0.001) loss 0.7854 (1.5458) lr 1.0000e-05 eta 2 days, 6:17:12
epoch [3/50] batch [20/2000] time 2.054 (2.067) data 0.000 (0.028) loss 0.2016 (1.4221) lr 1.0000e-05 eta 2 days, 7:06:48
epoch [3/50] batch [40/2000] time 2.053 (2.053) data 0.000 (0.014) loss 0.9036 (1.5278) lr 1.0000e-05 eta 2 days, 6:42:38
epoch [3/50] batch [60/2000] time 2.035 (2.047) data 0.000 (0.010) loss 3.5011 (1.6021) lr 1.0000e-05 eta 2 days, 6:32:22
epoch [3/50] batch [80/2000] time 2.008 (2.043) data 0.000 (0.007) loss 1.5685 (1.5722) lr 1.0000e-05 eta 2 days, 6:26:47
epoch [3/50] batch [100/2000] time 2.062 (2.042) data 0.000 (0.006) loss 3.2196 (1.5998) lr 1.0000e-05 eta 2 days, 6:23:47
epoch [3/50] batch [120/2000] time 2.056 (2.042) data 0.000 (0.005) loss 0.8945 (1.5775) lr 1.0000e-05 eta 2 days, 6:22:36
epoch [3/50] batch [140/2000] time 2.002 (2.041) data 0.000 (0.004) loss 0.8074 (1.5630) lr 1.0000e-05 eta 2 days, 6:20:33
epoch [3/50] batch [160/2000] time 2.057 (2.040) data 0.000 (0.004) loss 0.1731 (1.6539) lr 1.0000e-05 eta 2 days, 6:19:18
epoch [3/50] batch [180/2000] time 2.060 (2.040) data 0.000 (0.003) loss 3.6012 (1.5899) lr 1.0000e-05 eta 2 days, 6:18:07
epoch [3/50] batch [200/2000] time 2.030 (2.040) data 0.000 (0.003) loss 2.0918 (1.5938) lr 1.0000e-05 eta 2 days, 6:16:36
epoch [3/50] batch [220/2000] time 1.999 (2.039) data 0.000 (0.003) loss 1.3655 (1.5979) lr 1.0000e-05 eta 2 days, 6:15:37
epoch [3/50] batch [240/2000] time 1.984 (2.038) data 0.000 (0.003) loss 0.6118 (1.6025) lr 1.0000e-05 eta 2 days, 6:13:01
epoch [3/50] batch [260/2000] time 2.064 (2.038) data 0.000 (0.002) loss 1.1362 (1.5956) lr 1.0000e-05 eta 2 days, 6:12:14
epoch [3/50] batch [280/2000] time 2.037 (2.038) data 0.000 (0.002) loss 2.6191 (1.5941) lr 1.0000e-05 eta 2 days, 6:10:56
epoch [3/50] batch [300/2000] time 2.035 (2.038) data 0.000 (0.002) loss 2.5642 (1.5997) lr 1.0000e-05 eta 2 days, 6:09:53
epoch [3/50] batch [320/2000] time 2.037 (2.037) data 0.000 (0.002) loss 2.4558 (1.5868) lr 1.0000e-05 eta 2 days, 6:09:00
epoch [3/50] batch [340/2000] time 2.006 (2.037) data 0.000 (0.002) loss 2.3643 (1.5838) lr 1.0000e-05 eta 2 days, 6:08:12
epoch [3/50] batch [360/2000] time 2.009 (2.037) data 0.000 (0.002) loss 1.5301 (1.5730) lr 1.0000e-05 eta 2 days, 6:07:12
epoch [3/50] batch [380/2000] time 2.003 (2.037) data 0.000 (0.002) loss 1.6883 (1.5752) lr 1.0000e-05 eta 2 days, 6:06:35
epoch [3/50] batch [400/2000] time 2.040 (2.037) data 0.000 (0.002) loss 0.7872 (1.5667) lr 1.0000e-05 eta 2 days, 6:05:58
epoch [3/50] batch [420/2000] time 2.004 (2.037) data 0.000 (0.002) loss 0.0686 (1.5616) lr 1.0000e-05 eta 2 days, 6:05:24
epoch [3/50] batch [440/2000] time 2.002 (2.037) data 0.000 (0.002) loss 1.2131 (1.5361) lr 1.0000e-05 eta 2 days, 6:04:06
epoch [3/50] batch [460/2000] time 2.011 (2.037) data 0.000 (0.001) loss 0.5570 (1.5344) lr 1.0000e-05 eta 2 days, 6:03:43
epoch [3/50] batch [480/2000] time 2.050 (2.037) data 0.000 (0.001) loss 1.2461 (1.5401) lr 1.0000e-05 eta 2 days, 6:03:30
epoch [3/50] batch [500/2000] time 2.065 (2.037) data 0.000 (0.001) loss 2.8750 (1.5269) lr 1.0000e-05 eta 2 days, 6:02:34
epoch [3/50] batch [520/2000] time 2.056 (2.037) data 0.000 (0.001) loss 2.8008 (1.5253) lr 1.0000e-05 eta 2 days, 6:02:00
epoch [3/50] batch [540/2000] time 2.003 (2.037) data 0.000 (0.001) loss 2.1528 (1.5207) lr 1.0000e-05 eta 2 days, 6:01:06
epoch [3/50] batch [560/2000] time 2.035 (2.037) data 0.000 (0.001) loss 0.7902 (1.5369) lr 1.0000e-05 eta 2 days, 6:00:12
epoch [3/50] batch [580/2000] time 2.030 (2.037) data 0.000 (0.001) loss 0.4591 (1.5233) lr 1.0000e-05 eta 2 days, 5:59:27
epoch [3/50] batch [600/2000] time 2.027 (2.037) data 0.001 (0.001) loss 1.0660 (1.5207) lr 1.0000e-05 eta 2 days, 5:58:48
epoch [3/50] batch [620/2000] time 2.065 (2.037) data 0.000 (0.001) loss 0.9433 (1.5157) lr 1.0000e-05 eta 2 days, 5:57:55
epoch [3/50] batch [640/2000] time 2.056 (2.037) data 0.000 (0.001) loss 0.9775 (1.5052) lr 1.0000e-05 eta 2 days, 5:57:25
epoch [3/50] batch [660/2000] time 2.029 (2.037) data 0.000 (0.001) loss 0.7109 (1.5072) lr 1.0000e-05 eta 2 days, 5:56:59
epoch [3/50] batch [680/2000] time 2.047 (2.037) data 0.000 (0.001) loss 0.2631 (1.5029) lr 1.0000e-05 eta 2 days, 5:56:04
epoch [3/50] batch [700/2000] time 2.002 (2.037) data 0.000 (0.001) loss 2.3958 (1.5065) lr 1.0000e-05 eta 2 days, 5:55:27
epoch [3/50] batch [720/2000] time 2.034 (2.037) data 0.000 (0.001) loss 0.8974 (1.5111) lr 1.0000e-05 eta 2 days, 5:54:58
epoch [3/50] batch [740/2000] time 2.041 (2.037) data 0.000 (0.001) loss 2.7351 (1.5100) lr 1.0000e-05 eta 2 days, 5:54:24
epoch [3/50] batch [760/2000] time 1.988 (2.037) data 0.000 (0.001) loss 0.8689 (1.5050) lr 1.0000e-05 eta 2 days, 5:53:39
epoch [3/50] batch [780/2000] time 2.037 (2.037) data 0.000 (0.001) loss 1.3635 (1.4976) lr 1.0000e-05 eta 2 days, 5:52:48
epoch [3/50] batch [800/2000] time 2.003 (2.037) data 0.000 (0.001) loss 0.1525 (1.4980) lr 1.0000e-05 eta 2 days, 5:52:25
epoch [3/50] batch [820/2000] time 2.062 (2.037) data 0.000 (0.001) loss 0.7837 (1.5002) lr 1.0000e-05 eta 2 days, 5:51:39
epoch [3/50] batch [840/2000] time 2.036 (2.037) data 0.000 (0.001) loss 1.2140 (1.4934) lr 1.0000e-05 eta 2 days, 5:51:03
epoch [3/50] batch [860/2000] time 1.982 (2.037) data 0.000 (0.001) loss 1.2970 (1.4948) lr 1.0000e-05 eta 2 days, 5:50:16
epoch [3/50] batch [880/2000] time 2.063 (2.037) data 0.000 (0.001) loss 0.4884 (1.4915) lr 1.0000e-05 eta 2 days, 5:49:41
epoch [3/50] batch [900/2000] time 2.001 (2.037) data 0.000 (0.001) loss 1.1238 (1.4930) lr 1.0000e-05 eta 2 days, 5:48:57
epoch [3/50] batch [920/2000] time 2.048 (2.037) data 0.004 (0.001) loss 0.8773 (1.4927) lr 1.0000e-05 eta 2 days, 5:48:17
epoch [3/50] batch [940/2000] time 2.006 (2.037) data 0.000 (0.001) loss 1.3916 (1.4909) lr 1.0000e-05 eta 2 days, 5:47:41
epoch [3/50] batch [960/2000] time 2.055 (2.038) data 0.000 (0.001) loss 1.2522 (1.4853) lr 1.0000e-05 eta 2 days, 5:47:28
epoch [3/50] batch [980/2000] time 2.005 (2.037) data 0.000 (0.001) loss 1.0080 (1.4740) lr 1.0000e-05 eta 2 days, 5:46:19
epoch [3/50] batch [1000/2000] time 2.039 (2.037) data 0.000 (0.001) loss 3.3730 (1.4741) lr 1.0000e-05 eta 2 days, 5:45:47
epoch [3/50] batch [1020/2000] time 2.053 (2.037) data 0.000 (0.001) loss 2.0099 (1.4735) lr 1.0000e-05 eta 2 days, 5:45:12
epoch [3/50] batch [1040/2000] time 2.009 (2.037) data 0.000 (0.001) loss 0.0814 (1.4738) lr 1.0000e-05 eta 2 days, 5:44:31
epoch [3/50] batch [1060/2000] time 2.055 (2.037) data 0.000 (0.001) loss 1.0120 (1.4782) lr 1.0000e-05 eta 2 days, 5:43:40
epoch [3/50] batch [1080/2000] time 2.054 (2.037) data 0.000 (0.001) loss 0.6121 (1.4810) lr 1.0000e-05 eta 2 days, 5:42:53
epoch [3/50] batch [1100/2000] time 2.007 (2.037) data 0.000 (0.001) loss 2.0157 (1.4844) lr 1.0000e-05 eta 2 days, 5:42:07
epoch [3/50] batch [1120/2000] time 2.032 (2.037) data 0.000 (0.001) loss 2.2967 (1.4906) lr 1.0000e-05 eta 2 days, 5:41:26
epoch [3/50] batch [1140/2000] time 2.051 (2.037) data 0.001 (0.001) loss 1.1882 (1.4908) lr 1.0000e-05 eta 2 days, 5:40:43
epoch [3/50] batch [1160/2000] time 2.028 (2.037) data 0.000 (0.001) loss 0.5696 (1.4888) lr 1.0000e-05 eta 2 days, 5:39:54
epoch [3/50] batch [1180/2000] time 2.053 (2.037) data 0.000 (0.001) loss 0.1552 (1.4865) lr 1.0000e-05 eta 2 days, 5:39:12
epoch [3/50] batch [1200/2000] time 2.053 (2.037) data 0.000 (0.001) loss 0.6605 (1.4797) lr 1.0000e-05 eta 2 days, 5:38:21
epoch [3/50] batch [1220/2000] time 2.030 (2.037) data 0.000 (0.001) loss 1.8428 (1.4770) lr 1.0000e-05 eta 2 days, 5:37:22
epoch [3/50] batch [1240/2000] time 2.058 (2.037) data 0.000 (0.001) loss 1.1973 (1.4766) lr 1.0000e-05 eta 2 days, 5:36:34
epoch [3/50] batch [1260/2000] time 2.034 (2.037) data 0.000 (0.001) loss 2.0978 (1.4745) lr 1.0000e-05 eta 2 days, 5:35:55
epoch [3/50] batch [1280/2000] time 2.062 (2.037) data 0.000 (0.001) loss 1.7389 (1.4761) lr 1.0000e-05 eta 2 days, 5:35:23
epoch [3/50] batch [1300/2000] time 2.068 (2.037) data 0.000 (0.001) loss 1.2300 (1.4736) lr 1.0000e-05 eta 2 days, 5:35:01
epoch [3/50] batch [1320/2000] time 2.035 (2.037) data 0.000 (0.001) loss 0.5677 (1.4757) lr 1.0000e-05 eta 2 days, 5:34:31
epoch [3/50] batch [1340/2000] time 2.095 (2.037) data 0.000 (0.001) loss 1.0594 (1.4742) lr 1.0000e-05 eta 2 days, 5:34:02
epoch [3/50] batch [1360/2000] time 1.980 (2.037) data 0.000 (0.001) loss 0.6335 (1.4761) lr 1.0000e-05 eta 2 days, 5:33:22
epoch [3/50] batch [1380/2000] time 2.055 (2.037) data 0.000 (0.001) loss 2.1916 (1.4719) lr 1.0000e-05 eta 2 days, 5:32:44
epoch [3/50] batch [1400/2000] time 2.003 (2.037) data 0.000 (0.001) loss 2.1596 (1.4701) lr 1.0000e-05 eta 2 days, 5:32:10
epoch [3/50] batch [1420/2000] time 2.033 (2.037) data 0.000 (0.001) loss 0.6316 (1.4659) lr 1.0000e-05 eta 2 days, 5:31:31
epoch [3/50] batch [1440/2000] time 2.057 (2.037) data 0.000 (0.001) loss 0.7993 (1.4711) lr 1.0000e-05 eta 2 days, 5:30:56
epoch [3/50] batch [1460/2000] time 1.986 (2.037) data 0.000 (0.001) loss 2.2529 (1.4682) lr 1.0000e-05 eta 2 days, 5:30:20
epoch [3/50] batch [1480/2000] time 2.036 (2.037) data 0.000 (0.001) loss 1.9075 (1.4675) lr 1.0000e-05 eta 2 days, 5:29:40
epoch [3/50] batch [1500/2000] time 2.058 (2.038) data 0.000 (0.001) loss 1.7119 (1.4682) lr 1.0000e-05 eta 2 days, 5:29:03
epoch [3/50] batch [1520/2000] time 2.034 (2.037) data 0.000 (0.001) loss 0.1569 (1.4623) lr 1.0000e-05 eta 2 days, 5:28:20
epoch [3/50] batch [1540/2000] time 2.062 (2.037) data 0.000 (0.001) loss 1.4852 (1.4609) lr 1.0000e-05 eta 2 days, 5:27:37
epoch [3/50] batch [1560/2000] time 2.397 (2.040) data 0.000 (0.001) loss 1.0063 (1.4689) lr 1.0000e-05 eta 2 days, 5:31:38
epoch [3/50] batch [1580/2000] time 1.986 (2.045) data 0.000 (0.001) loss 1.7514 (1.4663) lr 1.0000e-05 eta 2 days, 5:37:28
epoch [3/50] batch [1600/2000] time 3.729 (2.054) data 0.000 (0.001) loss 2.6902 (1.4667) lr 1.0000e-05 eta 2 days, 5:51:17
epoch [3/50] batch [1620/2000] time 3.725 (2.069) data 0.000 (0.001) loss 1.8199 (1.4694) lr 1.0000e-05 eta 2 days, 6:14:01
epoch [3/50] batch [1640/2000] time 2.857 (2.083) data 0.000 (0.001) loss 2.5961 (1.4708) lr 1.0000e-05 eta 2 days, 6:36:01
epoch [3/50] batch [1660/2000] time 2.252 (2.096) data 0.000 (0.001) loss 1.1071 (1.4674) lr 1.0000e-05 eta 2 days, 6:56:10
epoch [3/50] batch [1680/2000] time 2.097 (2.101) data 0.001 (0.001) loss 0.6430 (1.4701) lr 1.0000e-05 eta 2 days, 7:02:45
epoch [3/50] batch [1700/2000] time 4.325 (2.116) data 0.000 (0.001) loss 0.7460 (1.4654) lr 1.0000e-05 eta 2 days, 7:24:55
epoch [3/50] batch [1720/2000] time 4.296 (2.141) data 0.000 (0.001) loss 0.2350 (1.4659) lr 1.0000e-05 eta 2 days, 8:04:00
epoch [3/50] batch [1740/2000] time 4.264 (2.168) data 0.004 (0.001) loss 0.5923 (1.4715) lr 1.0000e-05 eta 2 days, 8:45:49
epoch [3/50] batch [1760/2000] time 4.513 (2.199) data 0.000 (0.001) loss 0.8395 (1.4733) lr 1.0000e-05 eta 2 days, 9:34:01
epoch [3/50] batch [1780/2000] time 5.028 (2.236) data 0.000 (0.001) loss 0.5762 (1.4687) lr 1.0000e-05 eta 2 days, 10:31:33
epoch [3/50] batch [1800/2000] time 5.073 (2.273) data 0.000 (0.001) loss 1.5652 (1.4660) lr 1.0000e-05 eta 2 days, 11:28:07
epoch [3/50] batch [1820/2000] time 5.116 (2.301) data 0.000 (0.001) loss 1.7899 (1.4683) lr 1.0000e-05 eta 2 days, 12:12:23
epoch [3/50] batch [1840/2000] time 5.633 (2.323) data 0.000 (0.001) loss 0.4449 (1.4672) lr 1.0000e-05 eta 2 days, 12:45:26
epoch [3/50] batch [1860/2000] time 4.755 (2.354) data 0.000 (0.001) loss 1.3159 (1.4682) lr 1.0000e-05 eta 2 days, 13:32:52
epoch [3/50] batch [1880/2000] time 5.767 (2.380) data 0.000 (0.001) loss 0.0759 (1.4703) lr 1.0000e-05 eta 2 days, 14:13:08
epoch [3/50] batch [1900/2000] time 5.679 (2.413) data 0.000 (0.001) loss 0.7088 (1.4672) lr 1.0000e-05 eta 2 days, 15:05:09
epoch [3/50] batch [1920/2000] time 5.763 (2.447) data 0.000 (0.001) loss 0.3886 (1.4685) lr 1.0000e-05 eta 2 days, 15:56:19
epoch [3/50] batch [1940/2000] time 5.807 (2.479) data 0.000 (0.001) loss 2.0794 (1.4686) lr 1.0000e-05 eta 2 days, 16:45:59
epoch [3/50] batch [1960/2000] time 4.737 (2.501) data 0.000 (0.001) loss 1.1302 (1.4659) lr 1.0000e-05 eta 2 days, 17:20:19
epoch [3/50] batch [1980/2000] time 5.500 (2.524) data 0.001 (0.001) loss 0.8790 (1.4620) lr 1.0000e-05 eta 2 days, 17:55:18
epoch [3/50] batch [2000/2000] time 5.809 (2.551) data 0.000 (0.001) loss 0.6149 (1.4626) lr 1.0000e-05 eta 2 days, 18:36:25
epoch [4/50] batch [20/2000] time 6.367 (5.662) data 0.000 (0.035) loss 1.6062 (1.7447) lr 1.0000e-05 eta 6 days, 3:47:55
epoch [4/50] batch [40/2000] time 5.618 (5.333) data 0.005 (0.018) loss 1.8965 (1.5805) lr 1.0000e-05 eta 5 days, 19:11:05
epoch [4/50] batch [60/2000] time 4.896 (5.392) data 0.001 (0.012) loss 2.8744 (1.5786) lr 1.0000e-05 eta 5 days, 20:41:55
epoch [4/50] batch [80/2000] time 5.108 (5.428) data 0.001 (0.009) loss 0.7941 (1.5148) lr 1.0000e-05 eta 5 days, 21:36:51
epoch [4/50] batch [100/2000] time 4.383 (5.318) data 0.000 (0.008) loss 0.5640 (1.5349) lr 1.0000e-05 eta 5 days, 18:42:00
epoch [4/50] batch [120/2000] time 6.150 (5.433) data 0.000 (0.007) loss 0.2676 (1.5027) lr 1.0000e-05 eta 5 days, 21:41:02
epoch [4/50] batch [140/2000] time 6.189 (5.515) data 0.000 (0.006) loss 0.9293 (1.5280) lr 1.0000e-05 eta 5 days, 23:47:12
epoch [4/50] batch [160/2000] time 4.977 (5.582) data 0.009 (0.006) loss 0.1372 (1.5048) lr 1.0000e-05 eta 6 days, 1:29:34
epoch [4/50] batch [180/2000] time 6.175 (5.645) data 0.000 (0.005) loss 0.2715 (1.4685) lr 1.0000e-05 eta 6 days, 3:07:16
epoch [4/50] batch [200/2000] time 6.184 (5.685) data 0.001 (0.005) loss 1.2200 (1.4707) lr 1.0000e-05 eta 6 days, 4:07:06
epoch [4/50] batch [220/2000] time 6.142 (5.718) data 0.010 (0.004) loss 2.1175 (1.5062) lr 1.0000e-05 eta 6 days, 4:56:45
epoch [4/50] batch [240/2000] time 6.163 (5.755) data 0.000 (0.004) loss 2.6305 (1.5537) lr 1.0000e-05 eta 6 days, 5:53:20
epoch [4/50] batch [260/2000] time 6.133 (5.778) data 0.000 (0.004) loss 0.9841 (1.5228) lr 1.0000e-05 eta 6 days, 6:27:01
epoch [4/50] batch [280/2000] time 6.275 (5.789) data 0.000 (0.004) loss 0.3188 (1.5212) lr 1.0000e-05 eta 6 days, 6:42:04
epoch [4/50] batch [300/2000] time 6.164 (5.812) data 0.000 (0.004) loss 1.3086 (1.5120) lr 1.0000e-05 eta 6 days, 7:16:45
epoch [4/50] batch [320/2000] time 6.163 (5.826) data 0.000 (0.003) loss 5.3644 (1.5303) lr 1.0000e-05 eta 6 days, 7:35:37
epoch [4/50] batch [340/2000] time 6.171 (5.838) data 0.000 (0.003) loss 1.4738 (1.5349) lr 1.0000e-05 eta 6 days, 7:53:20
epoch [4/50] batch [360/2000] time 6.108 (5.855) data 0.003 (0.003) loss 0.7264 (1.5164) lr 1.0000e-05 eta 6 days, 8:17:17
epoch [4/50] batch [380/2000] time 6.137 (5.865) data 0.001 (0.003) loss 1.5744 (1.5277) lr 1.0000e-05 eta 6 days, 8:31:03
epoch [4/50] batch [400/2000] time 6.127 (5.873) data 0.000 (0.003) loss 0.8365 (1.5399) lr 1.0000e-05 eta 6 days, 8:41:50
epoch [4/50] batch [420/2000] time 5.056 (5.884) data 0.000 (0.003) loss 1.8871 (1.5337) lr 1.0000e-05 eta 6 days, 8:56:39
epoch [4/50] batch [440/2000] time 6.162 (5.894) data 0.000 (0.003) loss 1.7323 (1.5350) lr 1.0000e-05 eta 6 days, 9:10:49
epoch [4/50] batch [460/2000] time 6.109 (5.902) data 0.000 (0.003) loss 0.2011 (1.5528) lr 1.0000e-05 eta 6 days, 9:20:59
epoch [4/50] batch [480/2000] time 6.123 (5.908) data 0.000 (0.002) loss 0.7950 (1.5463) lr 1.0000e-05 eta 6 days, 9:28:05
epoch [4/50] batch [500/2000] time 6.139 (5.918) data 0.000 (0.002) loss 1.9220 (1.5292) lr 1.0000e-05 eta 6 days, 9:41:31
epoch [4/50] batch [520/2000] time 6.088 (5.923) data 0.000 (0.002) loss 2.0724 (1.5327) lr 1.0000e-05 eta 6 days, 9:48:39
epoch [4/50] batch [540/2000] time 6.162 (5.929) data 0.000 (0.002) loss 3.0292 (1.5302) lr 1.0000e-05 eta 6 days, 9:55:26
epoch [4/50] batch [560/2000] time 6.147 (5.937) data 0.005 (0.002) loss 2.6277 (1.5241) lr 1.0000e-05 eta 6 days, 10:06:19
epoch [4/50] batch [580/2000] time 6.341 (5.940) data 0.000 (0.002) loss 1.2430 (1.5126) lr 1.0000e-05 eta 6 days, 10:07:58
epoch [4/50] batch [600/2000] time 6.192 (5.944) data 0.001 (0.002) loss 0.2237 (1.5152) lr 1.0000e-05 eta 6 days, 10:12:53
epoch [4/50] batch [620/2000] time 6.112 (5.951) data 0.000 (0.002) loss 2.0736 (1.5145) lr 1.0000e-05 eta 6 days, 10:21:29
epoch [4/50] batch [640/2000] time 6.145 (5.954) data 0.000 (0.002) loss 0.6340 (1.5085) lr 1.0000e-05 eta 6 days, 10:24:56
epoch [4/50] batch [660/2000] time 4.541 (5.938) data 0.001 (0.002) loss 2.3700 (1.5045) lr 1.0000e-05 eta 6 days, 9:56:50
epoch [4/50] batch [680/2000] time 4.369 (5.896) data 0.002 (0.002) loss 0.6044 (1.5019) lr 1.0000e-05 eta 6 days, 8:50:35
epoch [4/50] batch [700/2000] time 4.272 (5.858) data 0.001 (0.002) loss 0.6820 (1.4972) lr 1.0000e-05 eta 6 days, 7:49:29
epoch [4/50] batch [720/2000] time 5.971 (5.845) data 0.000 (0.002) loss 2.1712 (1.4930) lr 1.0000e-05 eta 6 days, 7:27:13
epoch [4/50] batch [740/2000] time 5.981 (5.844) data 0.000 (0.002) loss 2.3940 (1.4920) lr 1.0000e-05 eta 6 days, 7:24:09
epoch [4/50] batch [760/2000] time 6.019 (5.844) data 0.000 (0.002) loss 1.9257 (1.5019) lr 1.0000e-05 eta 6 days, 7:22:03
epoch [4/50] batch [780/2000] time 5.956 (5.845) data 0.000 (0.002) loss 1.0979 (1.4895) lr 1.0000e-05 eta 6 days, 7:21:13
epoch [4/50] batch [800/2000] time 5.894 (5.845) data 0.000 (0.002) loss 0.4027 (1.4823) lr 1.0000e-05 eta 6 days, 7:19:53
epoch [4/50] batch [820/2000] time 5.342 (5.845) data 0.001 (0.002) loss 0.2242 (1.4864) lr 1.0000e-05 eta 6 days, 7:16:32
epoch [4/50] batch [840/2000] time 5.998 (5.844) data 0.000 (0.002) loss 0.2990 (1.4867) lr 1.0000e-05 eta 6 days, 7:14:22
epoch [4/50] batch [860/2000] time 5.290 (5.826) data 0.000 (0.002) loss 0.9232 (1.4856) lr 1.0000e-05 eta 6 days, 6:44:31
epoch [4/50] batch [880/2000] time 5.690 (5.811) data 0.000 (0.002) loss 1.1666 (1.4794) lr 1.0000e-05 eta 6 days, 6:18:22
epoch [4/50] batch [900/2000] time 5.828 (5.807) data 0.000 (0.002) loss 1.5027 (1.4825) lr 1.0000e-05 eta 6 days, 6:10:47
epoch [4/50] batch [920/2000] time 4.261 (5.798) data 0.000 (0.002) loss 1.4179 (1.4756) lr 1.0000e-05 eta 6 days, 5:55:12
epoch [4/50] batch [940/2000] time 4.213 (5.772) data 0.000 (0.002) loss 2.0873 (1.4733) lr 1.0000e-05 eta 6 days, 5:11:56
epoch [4/50] batch [960/2000] time 5.759 (5.756) data 0.000 (0.002) loss 0.1754 (1.4715) lr 1.0000e-05 eta 6 days, 4:45:13
epoch [4/50] batch [980/2000] time 5.594 (5.751) data 0.000 (0.002) loss 0.5282 (1.4715) lr 1.0000e-05 eta 6 days, 4:35:44
epoch [4/50] batch [1000/2000] time 5.585 (5.746) data 0.000 (0.002) loss 1.1575 (1.4641) lr 1.0000e-05 eta 6 days, 4:26:57
epoch [4/50] batch [1020/2000] time 4.467 (5.729) data 0.000 (0.002) loss 1.7244 (1.4729) lr 1.0000e-05 eta 6 days, 3:57:42
epoch [4/50] batch [1040/2000] time 2.344 (5.704) data 0.001 (0.002) loss 0.1970 (1.4707) lr 1.0000e-05 eta 6 days, 3:16:38
epoch [4/50] batch [1060/2000] time 4.510 (5.690) data 0.012 (0.002) loss 0.3283 (1.4638) lr 1.0000e-05 eta 6 days, 2:54:15
epoch [4/50] batch [1080/2000] time 5.748 (5.680) data 0.002 (0.002) loss 1.4630 (1.4656) lr 1.0000e-05 eta 6 days, 2:35:45
epoch [4/50] batch [1100/2000] time 5.451 (5.677) data 0.001 (0.001) loss 2.4479 (1.4696) lr 1.0000e-05 eta 6 days, 2:30:12
epoch [4/50] batch [1120/2000] time 5.160 (5.675) data 0.000 (0.001) loss 0.1037 (1.4703) lr 1.0000e-05 eta 6 days, 2:25:29
epoch [4/50] batch [1140/2000] time 5.444 (5.660) data 0.001 (0.001) loss 2.4326 (1.4724) lr 1.0000e-05 eta 6 days, 1:59:31
epoch [4/50] batch [1160/2000] time 4.298 (5.644) data 0.002 (0.001) loss 1.3447 (1.4687) lr 1.0000e-05 eta 6 days, 1:33:49
epoch [4/50] batch [1180/2000] time 5.808 (5.638) data 0.000 (0.001) loss 0.8252 (1.4607) lr 1.0000e-05 eta 6 days, 1:21:31
epoch [4/50] batch [1200/2000] time 5.755 (5.637) data 0.000 (0.001) loss 3.1133 (1.4575) lr 1.0000e-05 eta 6 days, 1:18:31
epoch [4/50] batch [1220/2000] time 4.380 (5.628) data 0.001 (0.001) loss 1.8721 (1.4602) lr 1.0000e-05 eta 6 days, 1:03:13
epoch [4/50] batch [1240/2000] time 5.772 (5.627) data 0.000 (0.001) loss 1.5022 (1.4639) lr 1.0000e-05 eta 6 days, 0:58:53
epoch [4/50] batch [1260/2000] time 5.749 (5.626) data 0.001 (0.001) loss 3.4357 (1.4653) lr 1.0000e-05 eta 6 days, 0:55:10
epoch [4/50] batch [1280/2000] time 5.750 (5.624) data 0.000 (0.001) loss 1.4372 (1.4647) lr 1.0000e-05 eta 6 days, 0:51:12
epoch [4/50] batch [1300/2000] time 4.280 (5.622) data 0.000 (0.001) loss 0.1683 (1.4644) lr 1.0000e-05 eta 6 days, 0:45:15
epoch [4/50] batch [1320/2000] time 6.172 (5.614) data 0.000 (0.001) loss 2.3071 (1.4592) lr 1.0000e-05 eta 6 days, 0:31:06
epoch [4/50] batch [1340/2000] time 5.278 (5.621) data 0.001 (0.001) loss 1.5431 (1.4622) lr 1.0000e-05 eta 6 days, 0:41:08
epoch [4/50] batch [1360/2000] time 6.188 (5.628) data 0.000 (0.001) loss 1.3753 (1.4593) lr 1.0000e-05 eta 6 days, 0:50:23
epoch [4/50] batch [1380/2000] time 6.179 (5.635) data 0.000 (0.001) loss 1.6032 (1.4566) lr 1.0000e-05 eta 6 days, 0:58:08
epoch [4/50] batch [1400/2000] time 6.344 (5.642) data 0.000 (0.001) loss 0.5422 (1.4602) lr 1.0000e-05 eta 6 days, 1:06:57
epoch [4/50] batch [1420/2000] time 6.387 (5.652) data 0.000 (0.001) loss 2.0396 (1.4616) lr 1.0000e-05 eta 6 days, 1:20:40
epoch [4/50] batch [1440/2000] time 6.341 (5.660) data 0.000 (0.001) loss 0.2743 (1.4620) lr 1.0000e-05 eta 6 days, 1:31:42
epoch [4/50] batch [1460/2000] time 6.314 (5.668) data 0.000 (0.001) loss 1.9976 (1.4594) lr 1.0000e-05 eta 6 days, 1:42:11
epoch [4/50] batch [1480/2000] time 5.438 (5.677) data 0.000 (0.001) loss 0.2847 (1.4572) lr 1.0000e-05 eta 6 days, 1:53:28
epoch [4/50] batch [1500/2000] time 6.515 (5.685) data 0.000 (0.001) loss 1.2627 (1.4586) lr 1.0000e-05 eta 6 days, 2:04:20
epoch [4/50] batch [1520/2000] time 5.683 (5.676) data 0.000 (0.001) loss 1.1979 (1.4648) lr 1.0000e-05 eta 6 days, 1:49:14
epoch [4/50] batch [1540/2000] time 5.707 (5.669) data 0.000 (0.001) loss 1.9528 (1.4650) lr 1.0000e-05 eta 6 days, 1:35:58
epoch [4/50] batch [1560/2000] time 4.278 (5.659) data 0.000 (0.001) loss 0.4121 (1.4632) lr 1.0000e-05 eta 6 days, 1:19:21
epoch [4/50] batch [1580/2000] time 5.703 (5.650) data 0.000 (0.001) loss 1.0133 (1.4596) lr 1.0000e-05 eta 6 days, 1:02:43
epoch [4/50] batch [1600/2000] time 5.828 (5.649) data 0.000 (0.001) loss 2.4544 (1.4616) lr 1.0000e-05 eta 6 days, 0:59:12
epoch [4/50] batch [1620/2000] time 4.506 (5.643) data 0.001 (0.001) loss 2.7623 (1.4625) lr 1.0000e-05 eta 6 days, 0:48:46
epoch [4/50] batch [1640/2000] time 4.537 (5.632) data 0.000 (0.001) loss 1.1029 (1.4600) lr 1.0000e-05 eta 6 days, 0:30:05
epoch [4/50] batch [1660/2000] time 4.503 (5.622) data 0.015 (0.001) loss 0.5560 (1.4594) lr 1.0000e-05 eta 6 days, 0:11:32
epoch [4/50] batch [1680/2000] time 6.339 (5.622) data 0.001 (0.001) loss 2.6564 (1.4617) lr 1.0000e-05 eta 6 days, 0:10:46
epoch [4/50] batch [1700/2000] time 5.797 (5.613) data 0.001 (0.001) loss 1.2351 (1.4596) lr 1.0000e-05 eta 5 days, 23:55:03
epoch [4/50] batch [1720/2000] time 5.592 (5.611) data 0.001 (0.001) loss 0.1296 (1.4638) lr 1.0000e-05 eta 5 days, 23:50:28
epoch [4/50] batch [1740/2000] time 5.219 (5.611) data 0.000 (0.001) loss 0.0687 (1.4636) lr 1.0000e-05 eta 5 days, 23:47:58
epoch [4/50] batch [1760/2000] time 4.330 (5.602) data 0.000 (0.001) loss 1.6938 (1.4622) lr 1.0000e-05 eta 5 days, 23:31:43
epoch [4/50] batch [1780/2000] time 6.124 (5.606) data 0.000 (0.001) loss 1.4038 (1.4636) lr 1.0000e-05 eta 5 days, 23:36:07
epoch [4/50] batch [1800/2000] time 6.142 (5.611) data 0.000 (0.001) loss 0.0390 (1.4680) lr 1.0000e-05 eta 5 days, 23:42:24
epoch [4/50] batch [1820/2000] time 3.170 (5.602) data 0.001 (0.001) loss 0.1401 (1.4700) lr 1.0000e-05 eta 5 days, 23:26:52
epoch [4/50] batch [1840/2000] time 4.847 (5.592) data 0.000 (0.001) loss 0.3752 (1.4698) lr 1.0000e-05 eta 5 days, 23:09:01
epoch [4/50] batch [1860/2000] time 6.037 (5.588) data 0.000 (0.001) loss 2.9913 (1.4733) lr 1.0000e-05 eta 5 days, 23:01:35
epoch [4/50] batch [1880/2000] time 5.627 (5.590) data 0.000 (0.001) loss 1.6040 (1.4728) lr 1.0000e-05 eta 5 days, 23:02:26
epoch [4/50] batch [1900/2000] time 5.949 (5.593) data 0.000 (0.001) loss 0.8863 (1.4744) lr 1.0000e-05 eta 5 days, 23:05:24
epoch [4/50] batch [1920/2000] time 5.992 (5.595) data 0.000 (0.001) loss 0.4545 (1.4726) lr 1.0000e-05 eta 5 days, 23:06:16
epoch [4/50] batch [1940/2000] time 5.988 (5.597) data 0.000 (0.001) loss 2.5341 (1.4725) lr 1.0000e-05 eta 5 days, 23:07:37
epoch [4/50] batch [1960/2000] time 5.892 (5.600) data 0.000 (0.001) loss 0.1289 (1.4721) lr 1.0000e-05 eta 5 days, 23:09:47
epoch [4/50] batch [1980/2000] time 5.445 (5.601) data 0.000 (0.001) loss 2.4199 (1.4716) lr 1.0000e-05 eta 5 days, 23:10:19
epoch [4/50] batch [2000/2000] time 5.304 (5.595) data 0.000 (0.001) loss 0.6651 (1.4674) lr 1.0000e-05 eta 5 days, 22:59:13
epoch [5/50] batch [20/2000] time 5.816 (5.413) data 0.000 (0.032) loss 0.6772 (1.5650) lr 1.0000e-05 eta 5 days, 18:18:01
epoch [5/50] batch [40/2000] time 4.531 (5.178) data 0.000 (0.017) loss 0.2555 (1.4481) lr 1.0000e-05 eta 5 days, 12:16:38
epoch [5/50] batch [60/2000] time 4.314 (4.973) data 0.001 (0.012) loss 0.3541 (1.4972) lr 1.0000e-05 eta 5 days, 6:59:53
epoch [5/50] batch [80/2000] time 5.832 (5.047) data 0.000 (0.009) loss 4.4910 (1.5474) lr 1.0000e-05 eta 5 days, 8:52:37
epoch [5/50] batch [100/2000] time 2.998 (4.804) data 0.001 (0.007) loss 3.3714 (1.5604) lr 1.0000e-05 eta 5 days, 2:38:42
epoch [5/50] batch [120/2000] time 4.178 (4.743) data 0.000 (0.006) loss 3.3540 (1.5669) lr 1.0000e-05 eta 5 days, 1:03:48
epoch [5/50] batch [140/2000] time 6.189 (4.746) data 0.000 (0.005) loss 0.5727 (1.5212) lr 1.0000e-05 eta 5 days, 1:05:52
epoch [5/50] batch [160/2000] time 6.243 (4.916) data 0.000 (0.005) loss 1.4904 (1.5500) lr 1.0000e-05 eta 5 days, 5:25:14
epoch [5/50] batch [180/2000] time 5.430 (5.043) data 0.000 (0.004) loss 1.4385 (1.5554) lr 1.0000e-05 eta 5 days, 8:37:05
epoch [5/50] batch [200/2000] time 4.441 (5.089) data 0.000 (0.004) loss 0.6020 (1.5758) lr 1.0000e-05 eta 5 days, 9:46:07
epoch [5/50] batch [220/2000] time 5.522 (5.130) data 0.000 (0.004) loss 0.3202 (1.5501) lr 1.0000e-05 eta 5 days, 10:47:26
epoch [5/50] batch [240/2000] time 4.727 (5.149) data 0.000 (0.003) loss 0.3097 (1.5525) lr 1.0000e-05 eta 5 days, 11:14:31
epoch [5/50] batch [260/2000] time 4.523 (5.126) data 0.000 (0.003) loss 1.4456 (1.5364) lr 1.0000e-05 eta 5 days, 10:37:12
epoch [5/50] batch [280/2000] time 6.122 (5.153) data 0.000 (0.003) loss 0.4276 (1.5224) lr 1.0000e-05 eta 5 days, 11:17:35
epoch [5/50] batch [300/2000] time 6.064 (5.191) data 0.000 (0.003) loss 0.7084 (1.5295) lr 1.0000e-05 eta 5 days, 12:14:08
epoch [5/50] batch [320/2000] time 4.472 (5.162) data 0.002 (0.003) loss 2.1371 (1.5540) lr 1.0000e-05 eta 5 days, 11:27:59
epoch [5/50] batch [340/2000] time 5.425 (5.162) data 0.001 (0.003) loss 1.6314 (1.5440) lr 1.0000e-05 eta 5 days, 11:26:15
epoch [5/50] batch [360/2000] time 4.654 (5.163) data 0.000 (0.002) loss 1.6643 (1.5327) lr 1.0000e-05 eta 5 days, 11:25:47
epoch [5/50] batch [380/2000] time 6.001 (5.179) data 0.004 (0.002) loss 2.3281 (1.5352) lr 1.0000e-05 eta 5 days, 11:48:55
epoch [5/50] batch [400/2000] time 6.010 (5.210) data 0.000 (0.002) loss 1.7782 (1.5360) lr 1.0000e-05 eta 5 days, 12:33:49
epoch [5/50] batch [420/2000] time 5.957 (5.237) data 0.000 (0.002) loss 1.3353 (1.5188) lr 1.0000e-05 eta 5 days, 13:13:51
epoch [5/50] batch [440/2000] time 5.708 (5.261) data 0.000 (0.002) loss 1.1075 (1.5103) lr 1.0000e-05 eta 5 days, 13:48:01
epoch [5/50] batch [460/2000] time 4.532 (5.253) data 0.000 (0.002) loss 2.8121 (1.4925) lr 1.0000e-05 eta 5 days, 13:34:39
epoch [5/50] batch [480/2000] time 4.817 (5.246) data 0.001 (0.002) loss 1.1133 (1.4886) lr 1.0000e-05 eta 5 days, 13:21:50
epoch [5/50] batch [500/2000] time 6.039 (5.257) data 0.000 (0.002) loss 0.9005 (1.5003) lr 1.0000e-05 eta 5 days, 13:37:04
epoch [5/50] batch [520/2000] time 4.628 (5.267) data 0.000 (0.002) loss 1.1290 (1.4946) lr 1.0000e-05 eta 5 days, 13:50:01
epoch [5/50] batch [540/2000] time 6.022 (5.279) data 0.000 (0.002) loss 1.4901 (1.4892) lr 1.0000e-05 eta 5 days, 14:07:31
epoch [5/50] batch [560/2000] time 5.991 (5.298) data 0.000 (0.002) loss 1.5657 (1.4953) lr 1.0000e-05 eta 5 days, 14:33:57
epoch [5/50] batch [580/2000] time 6.143 (5.317) data 0.000 (0.002) loss 0.2274 (1.4998) lr 1.0000e-05 eta 5 days, 15:00:49
epoch [5/50] batch [600/2000] time 5.891 (5.308) data 0.001 (0.002) loss 1.0195 (1.4862) lr 1.0000e-05 eta 5 days, 14:45:56
epoch [5/50] batch [620/2000] time 6.368 (5.342) data 0.000 (0.002) loss 0.7253 (1.4909) lr 1.0000e-05 eta 5 days, 15:36:06
epoch [5/50] batch [640/2000] time 6.302 (5.371) data 0.000 (0.002) loss 1.2083 (1.4915) lr 1.0000e-05 eta 5 days, 16:18:13
epoch [5/50] batch [660/2000] time 6.393 (5.398) data 0.000 (0.002) loss 1.3773 (1.4821) lr 1.0000e-05 eta 5 days, 16:57:21
epoch [5/50] batch [680/2000] time 6.280 (5.426) data 0.000 (0.002) loss 0.2321 (1.4737) lr 1.0000e-05 eta 5 days, 17:37:40
epoch [5/50] batch [700/2000] time 6.344 (5.450) data 0.000 (0.002) loss 3.1880 (1.4810) lr 1.0000e-05 eta 5 days, 18:12:19
epoch [5/50] batch [720/2000] time 6.363 (5.471) data 0.000 (0.002) loss 2.1834 (1.4855) lr 1.0000e-05 eta 5 days, 18:43:49
epoch [5/50] batch [740/2000] time 6.353 (5.495) data 0.012 (0.002) loss 0.5756 (1.4855) lr 1.0000e-05 eta 5 days, 19:18:02
epoch [5/50] batch [760/2000] time 6.370 (5.515) data 0.000 (0.001) loss 0.0267 (1.4787) lr 1.0000e-05 eta 5 days, 19:46:44
epoch [5/50] batch [780/2000] time 6.429 (5.534) data 0.000 (0.001) loss 1.3533 (1.4831) lr 1.0000e-05 eta 5 days, 20:13:59
epoch [5/50] batch [800/2000] time 6.265 (5.555) data 0.000 (0.001) loss 0.6174 (1.4810) lr 1.0000e-05 eta 5 days, 20:43:12
epoch [5/50] batch [820/2000] time 6.317 (5.572) data 0.000 (0.001) loss 1.0853 (1.4804) lr 1.0000e-05 eta 5 days, 21:06:58
epoch [5/50] batch [840/2000] time 6.367 (5.589) data 0.001 (0.001) loss 2.4927 (1.4825) lr 1.0000e-05 eta 5 days, 21:30:56
epoch [5/50] batch [860/2000] time 6.374 (5.607) data 0.000 (0.001) loss 1.1762 (1.4804) lr 1.0000e-05 eta 5 days, 21:56:36
epoch [5/50] batch [880/2000] time 6.492 (5.622) data 0.000 (0.001) loss 0.7263 (1.4872) lr 1.0000e-05 eta 5 days, 22:18:09
epoch [5/50] batch [900/2000] time 6.370 (5.636) data 0.000 (0.001) loss 1.5490 (1.4877) lr 1.0000e-05 eta 5 days, 22:37:26
epoch [5/50] batch [920/2000] time 6.322 (5.652) data 0.000 (0.001) loss 2.7925 (1.4840) lr 1.0000e-05 eta 5 days, 22:59:30
epoch [5/50] batch [940/2000] time 6.359 (5.665) data 0.000 (0.001) loss 0.6710 (1.4778) lr 1.0000e-05 eta 5 days, 23:17:19
epoch [5/50] batch [960/2000] time 6.171 (5.675) data 0.000 (0.001) loss 0.2268 (1.4785) lr 1.0000e-05 eta 5 days, 23:30:55
epoch [5/50] batch [980/2000] time 4.580 (5.683) data 0.000 (0.001) loss 0.6110 (1.4751) lr 1.0000e-05 eta 5 days, 23:41:35
epoch [5/50] batch [1000/2000] time 6.135 (5.693) data 0.000 (0.001) loss 2.2653 (1.4745) lr 1.0000e-05 eta 5 days, 23:53:45
epoch [5/50] batch [1020/2000] time 6.172 (5.699) data 0.000 (0.001) loss 0.4237 (1.4711) lr 1.0000e-05 eta 6 days, 0:02:12
epoch [5/50] batch [1040/2000] time 6.162 (5.706) data 0.001 (0.001) loss 0.5437 (1.4665) lr 1.0000e-05 eta 6 days, 0:10:53
epoch [5/50] batch [1060/2000] time 6.166 (5.715) data 0.000 (0.001) loss 1.0968 (1.4725) lr 1.0000e-05 eta 6 days, 0:21:46
epoch [5/50] batch [1080/2000] time 6.170 (5.721) data 0.000 (0.001) loss 1.2113 (1.4803) lr 1.0000e-05 eta 6 days, 0:29:41
epoch [5/50] batch [1100/2000] time 6.168 (5.727) data 0.000 (0.001) loss 1.5733 (1.4788) lr 1.0000e-05 eta 6 days, 0:36:36
epoch [5/50] batch [1120/2000] time 6.160 (5.734) data 0.000 (0.001) loss 2.5598 (1.4809) lr 1.0000e-05 eta 6 days, 0:45:43
epoch [5/50] batch [1140/2000] time 6.234 (5.740) data 0.001 (0.001) loss 0.3256 (1.4815) lr 1.0000e-05 eta 6 days, 0:52:52
epoch [5/50] batch [1160/2000] time 6.168 (5.746) data 0.009 (0.001) loss 0.6205 (1.4746) lr 1.0000e-05 eta 6 days, 0:59:54
epoch [5/50] batch [1180/2000] time 6.230 (5.753) data 0.000 (0.001) loss 0.8589 (1.4701) lr 1.0000e-05 eta 6 days, 1:08:20
epoch [5/50] batch [1200/2000] time 4.689 (5.738) data 0.001 (0.001) loss 1.4618 (1.4652) lr 1.0000e-05 eta 6 days, 0:43:37
epoch [5/50] batch [1220/2000] time 4.856 (5.720) data 0.000 (0.001) loss 0.6588 (1.4636) lr 1.0000e-05 eta 6 days, 0:14:51
epoch [5/50] batch [1240/2000] time 6.026 (5.716) data 0.000 (0.001) loss 0.5758 (1.4613) lr 1.0000e-05 eta 6 days, 0:06:50
epoch [5/50] batch [1260/2000] time 5.957 (5.719) data 0.001 (0.001) loss 1.1534 (1.4605) lr 1.0000e-05 eta 6 days, 0:09:08
epoch [5/50] batch [1280/2000] time 5.975 (5.722) data 0.000 (0.001) loss 0.5142 (1.4624) lr 1.0000e-05 eta 6 days, 0:11:55
epoch [5/50] batch [1300/2000] time 6.030 (5.724) data 0.001 (0.001) loss 0.1982 (1.4578) lr 1.0000e-05 eta 6 days, 0:13:26
epoch [5/50] batch [1320/2000] time 4.783 (5.726) data 0.000 (0.001) loss 3.1835 (1.4592) lr 1.0000e-05 eta 6 days, 0:14:25
epoch [5/50] batch [1340/2000] time 5.542 (5.708) data 0.000 (0.001) loss 0.3922 (1.4581) lr 1.0000e-05 eta 5 days, 23:44:30
epoch [5/50] batch [1360/2000] time 5.739 (5.706) data 0.000 (0.001) loss 1.4985 (1.4619) lr 1.0000e-05 eta 5 days, 23:40:05
epoch [5/50] batch [1380/2000] time 4.238 (5.699) data 0.000 (0.001) loss 0.1192 (1.4584) lr 1.0000e-05 eta 5 days, 23:27:59
epoch [5/50] batch [1400/2000] time 4.274 (5.683) data 0.000 (0.001) loss 1.3717 (1.4563) lr 1.0000e-05 eta 5 days, 23:01:20
epoch [5/50] batch [1420/2000] time 5.813 (5.675) data 0.000 (0.001) loss 1.3382 (1.4522) lr 1.0000e-05 eta 5 days, 22:47:15
epoch [5/50] batch [1440/2000] time 5.756 (5.672) data 0.000 (0.001) loss 2.0147 (1.4515) lr 1.0000e-05 eta 5 days, 22:40:48
epoch [5/50] batch [1460/2000] time 4.752 (5.669) data 0.000 (0.001) loss 0.1617 (1.4510) lr 1.0000e-05 eta 5 days, 22:35:02
epoch [5/50] batch [1480/2000] time 4.353 (5.661) data 0.000 (0.001) loss 1.1143 (1.4461) lr 1.0000e-05 eta 5 days, 22:20:15
epoch [5/50] batch [1500/2000] time 5.034 (5.644) data 0.000 (0.001) loss 2.3591 (1.4448) lr 1.0000e-05 eta 5 days, 21:53:44
epoch [5/50] batch [1520/2000] time 5.477 (5.639) data 0.000 (0.001) loss 0.9310 (1.4450) lr 1.0000e-05 eta 5 days, 21:43:36
epoch [5/50] batch [1540/2000] time 4.582 (5.627) data 0.000 (0.001) loss 1.3960 (1.4427) lr 1.0000e-05 eta 5 days, 21:23:04
epoch [5/50] batch [1560/2000] time 4.868 (5.626) data 0.000 (0.001) loss 0.2684 (1.4434) lr 1.0000e-05 eta 5 days, 21:20:57
epoch [5/50] batch [1580/2000] time 5.030 (5.626) data 0.000 (0.001) loss 0.6529 (1.4406) lr 1.0000e-05 eta 5 days, 21:18:55
epoch [5/50] batch [1600/2000] time 4.322 (5.624) data 0.000 (0.001) loss 0.6724 (1.4403) lr 1.0000e-05 eta 5 days, 21:13:00
epoch [5/50] batch [1620/2000] time 5.576 (5.614) data 0.000 (0.001) loss 3.6029 (1.4421) lr 1.0000e-05 eta 5 days, 20:56:08
epoch [5/50] batch [1640/2000] time 4.646 (5.601) data 0.000 (0.001) loss 0.3933 (1.4379) lr 1.0000e-05 eta 5 days, 20:35:42
epoch [5/50] batch [1660/2000] time 5.127 (5.602) data 0.000 (0.001) loss 1.8154 (1.4368) lr 1.0000e-05 eta 5 days, 20:34:08
epoch [5/50] batch [1680/2000] time 4.565 (5.596) data 0.013 (0.001) loss 0.3345 (1.4353) lr 1.0000e-05 eta 5 days, 20:23:46
epoch [5/50] batch [1700/2000] time 5.803 (5.595) data 0.000 (0.001) loss 0.5469 (1.4291) lr 1.0000e-05 eta 5 days, 20:20:54
epoch [5/50] batch [1720/2000] time 5.804 (5.595) data 0.000 (0.001) loss 1.6940 (1.4288) lr 1.0000e-05 eta 5 days, 20:18:02
epoch [5/50] batch [1740/2000] time 5.778 (5.594) data 0.000 (0.001) loss 1.1232 (1.4298) lr 1.0000e-05 eta 5 days, 20:15:16
epoch [5/50] batch [1760/2000] time 5.701 (5.594) data 0.000 (0.001) loss 1.9906 (1.4293) lr 1.0000e-05 eta 5 days, 20:12:54
epoch [5/50] batch [1780/2000] time 6.319 (5.585) data 0.000 (0.001) loss 3.6393 (1.4283) lr 1.0000e-05 eta 5 days, 19:57:41
epoch [5/50] batch [1800/2000] time 6.136 (5.591) data 0.006 (0.001) loss 2.3462 (1.4279) lr 1.0000e-05 eta 5 days, 20:05:48
epoch [5/50] batch [1820/2000] time 6.216 (5.597) data 0.000 (0.001) loss 0.9584 (1.4283) lr 1.0000e-05 eta 5 days, 20:11:57
epoch [5/50] batch [1840/2000] time 6.219 (5.602) data 0.000 (0.001) loss 3.4772 (1.4294) lr 1.0000e-05 eta 5 days, 20:17:55
epoch [5/50] batch [1860/2000] time 6.276 (5.608) data 0.000 (0.001) loss 0.8985 (1.4279) lr 1.0000e-05 eta 5 days, 20:25:26
epoch [5/50] batch [1880/2000] time 6.122 (5.613) data 0.000 (0.001) loss 0.6498 (1.4256) lr 1.0000e-05 eta 5 days, 20:30:46
epoch [5/50] batch [1900/2000] time 6.395 (5.619) data 0.000 (0.001) loss 1.7982 (1.4245) lr 1.0000e-05 eta 5 days, 20:38:01
epoch [5/50] batch [1920/2000] time 6.340 (5.627) data 0.000 (0.001) loss 1.2227 (1.4258) lr 1.0000e-05 eta 5 days, 20:47:45
epoch [5/50] batch [1940/2000] time 6.348 (5.634) data 0.000 (0.001) loss 1.3034 (1.4258) lr 1.0000e-05 eta 5 days, 20:56:00
epoch [5/50] batch [1960/2000] time 6.396 (5.640) data 0.000 (0.001) loss 2.6831 (1.4235) lr 1.0000e-05 eta 5 days, 21:03:33
epoch [5/50] batch [1980/2000] time 6.393 (5.647) data 0.000 (0.001) loss 0.6636 (1.4235) lr 1.0000e-05 eta 5 days, 21:12:55
epoch [5/50] batch [2000/2000] time 6.405 (5.654) data 0.000 (0.001) loss 2.0435 (1.4227) lr 2.0000e-03 eta 5 days, 21:20:22
epoch [6/50] batch [20/2000] time 6.321 (6.267) data 0.000 (0.030) loss 0.4985 (1.9314) lr 2.0000e-03 eta 6 days, 12:38:10
epoch [6/50] batch [40/2000] time 6.248 (6.247) data 0.000 (0.016) loss 0.2785 (1.9428) lr 2.0000e-03 eta 6 days, 12:06:37
epoch [6/50] batch [60/2000] time 6.403 (6.283) data 0.001 (0.010) loss 0.4112 (1.8447) lr 2.0000e-03 eta 6 days, 12:58:54
epoch [6/50] batch [80/2000] time 6.449 (6.278) data 0.000 (0.008) loss 0.8592 (1.7783) lr 2.0000e-03 eta 6 days, 12:48:36
epoch [6/50] batch [100/2000] time 6.367 (6.281) data 0.000 (0.006) loss 2.0708 (1.8117) lr 2.0000e-03 eta 6 days, 12:51:46
epoch [6/50] batch [120/2000] time 6.393 (6.294) data 0.000 (0.005) loss 0.9801 (1.7490) lr 2.0000e-03 eta 6 days, 13:08:33
epoch [6/50] batch [140/2000] time 6.354 (6.287) data 0.000 (0.005) loss 0.7721 (1.7429) lr 2.0000e-03 eta 6 days, 12:56:26
epoch [6/50] batch [160/2000] time 5.886 (6.262) data 0.000 (0.004) loss 0.6673 (1.6964) lr 2.0000e-03 eta 6 days, 12:16:41
epoch [6/50] batch [180/2000] time 6.212 (6.136) data 0.000 (0.004) loss 1.0354 (1.6407) lr 2.0000e-03 eta 6 days, 9:05:35
epoch [6/50] batch [200/2000] time 6.145 (6.134) data 0.000 (0.003) loss 4.5202 (1.6299) lr 2.0000e-03 eta 6 days, 9:00:16
epoch [6/50] batch [220/2000] time 6.241 (6.132) data 0.000 (0.003) loss 0.0136 (1.5945) lr 2.0000e-03 eta 6 days, 8:55:34
epoch [6/50] batch [240/2000] time 6.328 (6.128) data 0.000 (0.003) loss 0.6647 (1.5618) lr 2.0000e-03 eta 6 days, 8:47:09
epoch [6/50] batch [260/2000] time 5.228 (6.039) data 0.001 (0.003) loss 0.4437 (1.5543) lr 2.0000e-03 eta 6 days, 6:32:40
epoch [6/50] batch [280/2000] time 4.289 (5.956) data 0.000 (0.003) loss 2.0665 (1.5413) lr 2.0000e-03 eta 6 days, 4:25:56
epoch [6/50] batch [300/2000] time 4.901 (5.874) data 0.000 (0.003) loss 3.7055 (1.5457) lr 2.0000e-03 eta 6 days, 2:21:15
epoch [6/50] batch [320/2000] time 4.205 (5.779) data 0.000 (0.002) loss 0.7833 (1.5344) lr 2.0000e-03 eta 5 days, 23:58:06
epoch [6/50] batch [340/2000] time 4.404 (5.683) data 0.000 (0.002) loss 0.5537 (1.5416) lr 2.0000e-03 eta 5 days, 21:32:51
epoch [6/50] batch [360/2000] time 4.815 (5.644) data 0.000 (0.002) loss 1.2974 (1.5237) lr 2.0000e-03 eta 5 days, 20:31:56
epoch [6/50] batch [380/2000] time 3.966 (5.556) data 0.000 (0.002) loss 0.1786 (1.5320) lr 2.0000e-03 eta 5 days, 18:19:29
epoch [6/50] batch [400/2000] time 2.466 (5.449) data 0.000 (0.002) loss 1.3622 (1.5265) lr 2.0000e-03 eta 5 days, 15:37:34
epoch [6/50] batch [420/2000] time 3.608 (5.320) data 0.000 (0.002) loss 0.4625 (1.5120) lr 2.0000e-03 eta 5 days, 12:22:37
epoch [6/50] batch [440/2000] time 2.470 (5.209) data 0.000 (0.002) loss 0.6795 (1.4880) lr 2.0000e-03 eta 5 days, 9:35:56
epoch [6/50] batch [460/2000] time 3.479 (5.115) data 0.000 (0.002) loss 0.2363 (1.4805) lr 2.0000e-03 eta 5 days, 7:13:33
epoch [6/50] batch [480/2000] time 3.992 (5.051) data 0.000 (0.002) loss 2.8916 (1.4712) lr 2.0000e-03 eta 5 days, 5:35:21
epoch [6/50] batch [500/2000] time 4.198 (4.980) data 0.000 (0.002) loss 2.3021 (1.4683) lr 2.0000e-03 eta 5 days, 3:49:01
epoch [6/50] batch [520/2000] time 3.984 (4.914) data 0.001 (0.002) loss 1.2952 (1.4678) lr 2.0000e-03 eta 5 days, 2:08:36
epoch [6/50] batch [540/2000] time 3.706 (4.866) data 0.000 (0.002) loss 0.1187 (1.4653) lr 2.0000e-03 eta 5 days, 0:54:44
epoch [6/50] batch [560/2000] time 2.399 (4.815) data 0.000 (0.002) loss 1.7700 (1.4647) lr 2.0000e-03 eta 4 days, 23:37:03
epoch [6/50] batch [580/2000] time 4.363 (4.748) data 0.000 (0.002) loss 0.7298 (1.4532) lr 2.0000e-03 eta 4 days, 21:56:32
epoch [6/50] batch [600/2000] time 4.343 (4.734) data 0.001 (0.002) loss 1.4798 (1.4612) lr 2.0000e-03 eta 4 days, 21:33:55
epoch [6/50] batch [620/2000] time 4.365 (4.715) data 0.000 (0.001) loss 2.3813 (1.4581) lr 2.0000e-03 eta 4 days, 21:03:04
epoch [6/50] batch [640/2000] time 4.283 (4.696) data 0.000 (0.001) loss 0.0922 (1.4504) lr 2.0000e-03 eta 4 days, 20:34:27
epoch [6/50] batch [660/2000] time 4.347 (4.685) data 0.000 (0.001) loss 2.7471 (1.4486) lr 2.0000e-03 eta 4 days, 20:15:28
epoch [6/50] batch [680/2000] time 4.373 (4.668) data 0.000 (0.001) loss 2.7830 (1.4475) lr 2.0000e-03 eta 4 days, 19:49:37
epoch [6/50] batch [700/2000] time 3.981 (4.652) data 0.000 (0.001) loss 0.8335 (1.4556) lr 2.0000e-03 eta 4 days, 19:22:59
epoch [6/50] batch [720/2000] time 4.376 (4.642) data 0.000 (0.001) loss 1.1080 (1.4557) lr 2.0000e-03 eta 4 days, 19:07:16
epoch [6/50] batch [740/2000] time 4.243 (4.627) data 0.000 (0.001) loss 0.5731 (1.4540) lr 2.0000e-03 eta 4 days, 18:43:50
epoch [6/50] batch [760/2000] time 4.317 (4.615) data 0.000 (0.001) loss 1.3714 (1.4585) lr 2.0000e-03 eta 4 days, 18:23:30
epoch [6/50] batch [780/2000] time 4.358 (4.607) data 0.000 (0.001) loss 1.6728 (1.4516) lr 2.0000e-03 eta 4 days, 18:10:56
epoch [6/50] batch [800/2000] time 4.338 (4.595) data 0.000 (0.001) loss 1.3731 (1.4487) lr 2.0000e-03 eta 4 days, 17:51:53
epoch [6/50] batch [820/2000] time 4.335 (4.584) data 0.000 (0.001) loss 0.6218 (1.4469) lr 2.0000e-03 eta 4 days, 17:33:48
epoch [6/50] batch [840/2000] time 4.256 (4.578) data 0.000 (0.001) loss 0.1575 (1.4520) lr 2.0000e-03 eta 4 days, 17:22:23
epoch [6/50] batch [860/2000] time 4.247 (4.568) data 0.000 (0.001) loss 0.9123 (1.4471) lr 2.0000e-03 eta 4 days, 17:06:42
epoch [6/50] batch [880/2000] time 4.371 (4.558) data 0.000 (0.001) loss 0.2261 (1.4516) lr 2.0000e-03 eta 4 days, 16:50:13
epoch [6/50] batch [900/2000] time 2.451 (4.550) data 0.000 (0.001) loss 0.5406 (1.4453) lr 2.0000e-03 eta 4 days, 16:37:24
epoch [6/50] batch [920/2000] time 4.364 (4.545) data 0.000 (0.001) loss 0.4862 (1.4418) lr 2.0000e-03 eta 4 days, 16:27:43
epoch [6/50] batch [940/2000] time 4.307 (4.537) data 0.000 (0.001) loss 3.7146 (1.4454) lr 2.0000e-03 eta 4 days, 16:13:57
epoch [6/50] batch [960/2000] time 2.481 (4.527) data 0.000 (0.001) loss 1.1206 (1.4412) lr 2.0000e-03 eta 4 days, 15:57:46
epoch [6/50] batch [980/2000] time 2.460 (4.488) data 0.000 (0.001) loss 1.5547 (1.4448) lr 2.0000e-03 eta 4 days, 14:58:01
epoch [6/50] batch [1000/2000] time 2.417 (4.449) data 0.000 (0.001) loss 0.9239 (1.4435) lr 2.0000e-03 eta 4 days, 14:00:03
epoch [6/50] batch [1020/2000] time 2.487 (4.412) data 0.000 (0.001) loss 2.4230 (1.4384) lr 2.0000e-03 eta 4 days, 13:03:29
epoch [6/50] batch [1040/2000] time 3.028 (4.380) data 0.000 (0.001) loss 2.5899 (1.4342) lr 2.0000e-03 eta 4 days, 12:13:39
epoch [6/50] batch [1060/2000] time 4.059 (4.352) data 0.000 (0.001) loss 1.6510 (1.4329) lr 2.0000e-03 eta 4 days, 11:31:34
epoch [6/50] batch [1080/2000] time 4.146 (4.344) data 0.001 (0.001) loss 3.1078 (1.4290) lr 2.0000e-03 eta 4 days, 11:18:00
epoch [6/50] batch [1100/2000] time 4.149 (4.336) data 0.001 (0.001) loss 2.3140 (1.4302) lr 2.0000e-03 eta 4 days, 11:04:28
epoch [6/50] batch [1120/2000] time 4.101 (4.329) data 0.000 (0.001) loss 0.3628 (1.4232) lr 2.0000e-03 eta 4 days, 10:52:03
epoch [6/50] batch [1140/2000] time 4.025 (4.322) data 0.001 (0.001) loss 3.2346 (1.4203) lr 2.0000e-03 eta 4 days, 10:40:19
epoch [6/50] batch [1160/2000] time 4.114 (4.314) data 0.000 (0.001) loss 2.4293 (1.4209) lr 2.0000e-03 eta 4 days, 10:27:38
epoch [6/50] batch [1180/2000] time 4.007 (4.308) data 0.001 (0.001) loss 0.3332 (1.4202) lr 2.0000e-03 eta 4 days, 10:16:38
epoch [6/50] batch [1200/2000] time 4.104 (4.301) data 0.000 (0.001) loss 0.8321 (1.4240) lr 2.0000e-03 eta 4 days, 10:06:06
epoch [6/50] batch [1220/2000] time 3.357 (4.279) data 0.000 (0.001) loss 0.6716 (1.4203) lr 2.0000e-03 eta 4 days, 9:31:14
epoch [6/50] batch [1240/2000] time 3.790 (4.260) data 0.001 (0.001) loss 0.1818 (1.4205) lr 2.0000e-03 eta 4 days, 9:01:40
epoch [6/50] batch [1260/2000] time 3.317 (4.250) data 0.000 (0.001) loss 1.1253 (1.4193) lr 2.0000e-03 eta 4 days, 8:46:15
epoch [6/50] batch [1280/2000] time 2.444 (4.223) data 0.000 (0.001) loss 1.5458 (1.4272) lr 2.0000e-03 eta 4 days, 8:04:52
epoch [6/50] batch [1300/2000] time 2.997 (4.197) data 0.000 (0.001) loss 3.1182 (1.4257) lr 2.0000e-03 eta 4 days, 7:24:32
epoch [6/50] batch [1320/2000] time 2.460 (4.172) data 0.000 (0.001) loss 2.6705 (1.4251) lr 2.0000e-03 eta 4 days, 6:45:37
epoch [6/50] batch [1340/2000] time 2.464 (4.147) data 0.000 (0.001) loss 2.3952 (1.4187) lr 2.0000e-03 eta 4 days, 6:08:33
epoch [6/50] batch [1360/2000] time 2.630 (4.124) data 0.000 (0.001) loss 0.9472 (1.4163) lr 2.0000e-03 eta 4 days, 5:33:11
epoch [6/50] batch [1380/2000] time 2.507 (4.102) data 0.000 (0.001) loss 1.4531 (1.4127) lr 2.0000e-03 eta 4 days, 4:58:40
epoch [6/50] batch [1400/2000] time 2.537 (4.081) data 0.000 (0.001) loss 2.2327 (1.4132) lr 2.0000e-03 eta 4 days, 4:25:39
epoch [6/50] batch [1420/2000] time 2.514 (4.060) data 0.000 (0.001) loss 0.3822 (1.4084) lr 2.0000e-03 eta 4 days, 3:53:48
epoch [6/50] batch [1440/2000] time 2.509 (4.038) data 0.000 (0.001) loss 2.5019 (1.4104) lr 2.0000e-03 eta 4 days, 3:20:39
epoch [6/50] batch [1460/2000] time 2.508 (4.017) data 0.000 (0.001) loss 3.1857 (1.4132) lr 2.0000e-03 eta 4 days, 2:47:47
epoch [6/50] batch [1480/2000] time 2.368 (3.996) data 0.000 (0.001) loss 2.9374 (1.4138) lr 2.0000e-03 eta 4 days, 2:15:41
epoch [6/50] batch [1500/2000] time 2.510 (3.976) data 0.000 (0.001) loss 3.5587 (1.4120) lr 2.0000e-03 eta 4 days, 1:44:16
epoch [6/50] batch [1520/2000] time 2.428 (3.956) data 0.000 (0.001) loss 0.3083 (1.4141) lr 2.0000e-03 eta 4 days, 1:13:50
epoch [6/50] batch [1540/2000] time 2.478 (3.937) data 0.000 (0.001) loss 1.0949 (1.4080) lr 2.0000e-03 eta 4 days, 0:44:03
epoch [6/50] batch [1560/2000] time 2.515 (3.918) data 0.000 (0.001) loss 1.3768 (1.4057) lr 2.0000e-03 eta 4 days, 0:15:06
epoch [6/50] batch [1580/2000] time 2.483 (3.900) data 0.000 (0.001) loss 1.8722 (1.4065) lr 2.0000e-03 eta 3 days, 23:46:49
epoch [6/50] batch [1600/2000] time 2.504 (3.882) data 0.000 (0.001) loss 1.3367 (1.4063) lr 2.0000e-03 eta 3 days, 23:19:02
epoch [6/50] batch [1620/2000] time 2.515 (3.864) data 0.000 (0.001) loss 0.2678 (1.4031) lr 2.0000e-03 eta 3 days, 22:52:17
epoch [6/50] batch [1640/2000] time 2.384 (3.847) data 0.000 (0.001) loss 1.1811 (1.3991) lr 2.0000e-03 eta 3 days, 22:25:44
epoch [6/50] batch [1660/2000] time 2.432 (3.831) data 0.000 (0.001) loss 1.5415 (1.3982) lr 2.0000e-03 eta 3 days, 22:00:03
epoch [6/50] batch [1680/2000] time 2.708 (3.815) data 0.001 (0.001) loss 2.7397 (1.3967) lr 2.0000e-03 eta 3 days, 21:35:17
epoch [6/50] batch [1700/2000] time 2.513 (3.799) data 0.000 (0.001) loss 0.3924 (1.3974) lr 2.0000e-03 eta 3 days, 21:10:47
epoch [6/50] batch [1720/2000] time 2.501 (3.784) data 0.000 (0.001) loss 0.2761 (1.3927) lr 2.0000e-03 eta 3 days, 20:46:58
epoch [6/50] batch [1740/2000] time 2.419 (3.769) data 0.000 (0.001) loss 0.8814 (1.3887) lr 2.0000e-03 eta 3 days, 20:23:35
epoch [6/50] batch [1760/2000] time 2.517 (3.754) data 0.000 (0.001) loss 0.0992 (1.3820) lr 2.0000e-03 eta 3 days, 20:00:34
epoch [6/50] batch [1780/2000] time 2.541 (3.740) data 0.000 (0.001) loss 0.3373 (1.3832) lr 2.0000e-03 eta 3 days, 19:38:23
epoch [6/50] batch [1800/2000] time 2.502 (3.725) data 0.000 (0.001) loss 1.6829 (1.3854) lr 2.0000e-03 eta 3 days, 19:16:29
epoch [6/50] batch [1820/2000] time 2.438 (3.712) data 0.000 (0.001) loss 2.6652 (1.3887) lr 2.0000e-03 eta 3 days, 18:54:43
epoch [6/50] batch [1840/2000] time 2.468 (3.698) data 0.001 (0.001) loss 0.2049 (1.3871) lr 2.0000e-03 eta 3 days, 18:33:48
epoch [6/50] batch [1860/2000] time 2.490 (3.685) data 0.000 (0.001) loss 2.4068 (1.3848) lr 2.0000e-03 eta 3 days, 18:13:16
epoch [6/50] batch [1880/2000] time 2.515 (3.672) data 0.000 (0.001) loss 0.9968 (1.3862) lr 2.0000e-03 eta 3 days, 17:53:14
epoch [6/50] batch [1900/2000] time 2.416 (3.660) data 0.000 (0.001) loss 1.9488 (1.3848) lr 2.0000e-03 eta 3 days, 17:33:25
epoch [6/50] batch [1920/2000] time 2.458 (3.647) data 0.000 (0.001) loss 2.7397 (1.3868) lr 2.0000e-03 eta 3 days, 17:13:52
epoch [6/50] batch [1940/2000] time 2.512 (3.635) data 0.004 (0.001) loss 0.8471 (1.3846) lr 2.0000e-03 eta 3 days, 16:54:59
epoch [6/50] batch [1960/2000] time 2.483 (3.623) data 0.000 (0.001) loss 1.5047 (1.3851) lr 2.0000e-03 eta 3 days, 16:36:22
epoch [6/50] batch [1980/2000] time 2.467 (3.612) data 0.000 (0.001) loss 2.3148 (1.3873) lr 2.0000e-03 eta 3 days, 16:18:25
epoch [6/50] batch [2000/2000] time 2.420 (3.600) data 0.000 (0.001) loss 0.3757 (1.3833) lr 1.9980e-03 eta 3 days, 16:00:35
epoch [7/50] batch [20/2000] time 2.461 (2.523) data 0.000 (0.037) loss 2.4883 (1.0512) lr 1.9980e-03 eta 2 days, 13:39:45
epoch [7/50] batch [40/2000] time 2.397 (2.488) data 0.000 (0.019) loss 0.8711 (1.1330) lr 1.9980e-03 eta 2 days, 12:47:53
epoch [7/50] batch [60/2000] time 2.488 (2.483) data 0.001 (0.013) loss 2.9140 (1.0852) lr 1.9980e-03 eta 2 days, 12:39:13
epoch [7/50] batch [80/2000] time 2.463 (2.481) data 0.000 (0.010) loss 2.7428 (1.1627) lr 1.9980e-03 eta 2 days, 12:35:57
epoch [7/50] batch [100/2000] time 2.513 (2.478) data 0.000 (0.008) loss 1.0788 (1.1670) lr 1.9980e-03 eta 2 days, 12:30:19
epoch [7/50] batch [120/2000] time 2.510 (2.477) data 0.000 (0.006) loss 1.7632 (1.1595) lr 1.9980e-03 eta 2 days, 12:28:18
epoch [7/50] batch [140/2000] time 2.427 (2.475) data 0.000 (0.006) loss 0.3738 (1.1047) lr 1.9980e-03 eta 2 days, 12:24:32
epoch [7/50] batch [160/2000] time 2.439 (2.474) data 0.000 (0.005) loss 0.4333 (1.0889) lr 1.9980e-03 eta 2 days, 12:22:20
epoch [7/50] batch [180/2000] time 2.451 (2.474) data 0.000 (0.004) loss 0.2526 (1.1164) lr 1.9980e-03 eta 2 days, 12:20:30
epoch [7/50] batch [200/2000] time 2.505 (2.472) data 0.000 (0.004) loss 0.3944 (1.1228) lr 1.9980e-03 eta 2 days, 12:17:45
epoch [7/50] batch [220/2000] time 2.439 (2.472) data 0.001 (0.004) loss 0.5604 (1.1425) lr 1.9980e-03 eta 2 days, 12:15:56
epoch [7/50] batch [240/2000] time 2.509 (2.472) data 0.000 (0.003) loss 0.3176 (1.1418) lr 1.9980e-03 eta 2 days, 12:15:35
epoch [7/50] batch [260/2000] time 2.489 (2.471) data 0.000 (0.003) loss 0.4739 (1.1546) lr 1.9980e-03 eta 2 days, 12:13:45
epoch [7/50] batch [280/2000] time 2.497 (2.472) data 0.000 (0.003) loss 3.6647 (1.1380) lr 1.9980e-03 eta 2 days, 12:13:28
epoch [7/50] batch [300/2000] time 2.422 (2.472) data 0.000 (0.003) loss 1.1713 (1.1725) lr 1.9980e-03 eta 2 days, 12:12:31
epoch [7/50] batch [320/2000] time 2.510 (2.472) data 0.000 (0.003) loss 1.6346 (1.1721) lr 1.9980e-03 eta 2 days, 12:11:54
epoch [7/50] batch [340/2000] time 2.487 (2.472) data 0.000 (0.003) loss 2.3134 (1.1946) lr 1.9980e-03 eta 2 days, 12:11:38
epoch [7/50] batch [360/2000] time 2.506 (2.473) data 0.000 (0.002) loss 1.6677 (1.1870) lr 1.9980e-03 eta 2 days, 12:11:36
epoch [7/50] batch [380/2000] time 2.505 (2.473) data 0.000 (0.002) loss 2.0751 (1.2189) lr 1.9980e-03 eta 2 days, 12:11:05
epoch [7/50] batch [400/2000] time 2.441 (2.473) data 0.000 (0.002) loss 0.7676 (1.2126) lr 1.9980e-03 eta 2 days, 12:09:51
epoch [7/50] batch [420/2000] time 2.488 (2.472) data 0.000 (0.002) loss 0.3754 (1.2084) lr 1.9980e-03 eta 2 days, 12:08:14
epoch [7/50] batch [440/2000] time 2.495 (2.473) data 0.000 (0.002) loss 0.4003 (1.2210) lr 1.9980e-03 eta 2 days, 12:08:12
epoch [7/50] batch [460/2000] time 2.372 (2.472) data 0.001 (0.002) loss 0.5681 (1.2272) lr 1.9980e-03 eta 2 days, 12:07:10
epoch [7/50] batch [480/2000] time 2.487 (2.473) data 0.000 (0.002) loss 0.9870 (1.2287) lr 1.9980e-03 eta 2 days, 12:06:41
epoch [7/50] batch [500/2000] time 2.455 (2.473) data 0.000 (0.002) loss 0.7009 (1.2416) lr 1.9980e-03 eta 2 days, 12:06:02
epoch [7/50] batch [520/2000] time 2.486 (2.472) data 0.000 (0.002) loss 0.4754 (1.2349) lr 1.9980e-03 eta 2 days, 12:04:31
epoch [7/50] batch [540/2000] time 2.517 (2.472) data 0.000 (0.002) loss 1.4865 (1.2355) lr 1.9980e-03 eta 2 days, 12:03:45
epoch [7/50] batch [560/2000] time 2.488 (2.472) data 0.000 (0.002) loss 2.4241 (1.2379) lr 1.9980e-03 eta 2 days, 12:03:09
epoch [7/50] batch [580/2000] time 2.439 (2.472) data 0.000 (0.002) loss 2.7423 (1.2436) lr 1.9980e-03 eta 2 days, 12:01:45
epoch [7/50] batch [600/2000] time 2.512 (2.472) data 0.001 (0.002) loss 0.1929 (1.2435) lr 1.9980e-03 eta 2 days, 12:01:28
epoch [7/50] batch [620/2000] time 2.451 (2.472) data 0.000 (0.002) loss 1.7383 (1.2488) lr 1.9980e-03 eta 2 days, 12:00:41
epoch [7/50] batch [640/2000] time 2.483 (2.473) data 0.000 (0.002) loss 0.0380 (1.2362) lr 1.9980e-03 eta 2 days, 12:00:06
epoch [7/50] batch [660/2000] time 2.515 (2.473) data 0.001 (0.001) loss 1.4912 (1.2305) lr 1.9980e-03 eta 2 days, 11:59:23
epoch [7/50] batch [680/2000] time 2.483 (2.472) data 0.000 (0.001) loss 1.4222 (1.2278) lr 1.9980e-03 eta 2 days, 11:57:49
epoch [7/50] batch [700/2000] time 2.459 (2.472) data 0.000 (0.001) loss 1.7038 (1.2277) lr 1.9980e-03 eta 2 days, 11:57:03
epoch [7/50] batch [720/2000] time 2.421 (2.472) data 0.000 (0.001) loss 1.3340 (1.2332) lr 1.9980e-03 eta 2 days, 11:55:57
epoch [7/50] batch [740/2000] time 2.513 (2.472) data 0.000 (0.001) loss 0.1009 (1.2318) lr 1.9980e-03 eta 2 days, 11:55:09
epoch [7/50] batch [760/2000] time 2.462 (2.472) data 0.000 (0.001) loss 3.5888 (1.2431) lr 1.9980e-03 eta 2 days, 11:54:19
epoch [7/50] batch [780/2000] time 2.400 (2.472) data 0.000 (0.001) loss 0.0049 (1.2373) lr 1.9980e-03 eta 2 days, 11:53:26
epoch [7/50] batch [800/2000] time 2.506 (2.472) data 0.000 (0.001) loss 4.1720 (1.2461) lr 1.9980e-03 eta 2 days, 11:53:07
epoch [7/50] batch [820/2000] time 2.512 (2.473) data 0.000 (0.001) loss 1.0847 (1.2394) lr 1.9980e-03 eta 2 days, 11:52:32
epoch [7/50] batch [840/2000] time 2.492 (2.472) data 0.000 (0.001) loss 0.7582 (1.2389) lr 1.9980e-03 eta 2 days, 11:51:37
epoch [7/50] batch [860/2000] time 2.516 (2.472) data 0.000 (0.001) loss 2.4188 (1.2444) lr 1.9980e-03 eta 2 days, 11:50:45
epoch [7/50] batch [880/2000] time 2.344 (2.472) data 0.000 (0.001) loss 0.6466 (1.2392) lr 1.9980e-03 eta 2 days, 11:49:30
epoch [7/50] batch [900/2000] time 2.524 (2.472) data 0.000 (0.001) loss 2.2432 (1.2417) lr 1.9980e-03 eta 2 days, 11:48:52
epoch [7/50] batch [920/2000] time 2.509 (2.472) data 0.000 (0.001) loss 2.1312 (1.2517) lr 1.9980e-03 eta 2 days, 11:48:16
epoch [7/50] batch [940/2000] time 2.330 (2.472) data 0.000 (0.001) loss 0.3375 (1.2576) lr 1.9980e-03 eta 2 days, 11:46:46
epoch [7/50] batch [960/2000] time 2.458 (2.472) data 0.000 (0.001) loss 0.4561 (1.2607) lr 1.9980e-03 eta 2 days, 11:45:30
epoch [7/50] batch [980/2000] time 2.467 (2.472) data 0.001 (0.001) loss 0.7456 (1.2653) lr 1.9980e-03 eta 2 days, 11:44:50
epoch [7/50] batch [1000/2000] time 2.420 (2.472) data 0.000 (0.001) loss 0.4687 (1.2609) lr 1.9980e-03 eta 2 days, 11:43:49
epoch [7/50] batch [1020/2000] time 2.461 (2.472) data 0.000 (0.001) loss 0.1355 (1.2592) lr 1.9980e-03 eta 2 days, 11:43:04
epoch [7/50] batch [1040/2000] time 2.460 (2.472) data 0.000 (0.001) loss 2.0981 (1.2576) lr 1.9980e-03 eta 2 days, 11:42:35
epoch [7/50] batch [1060/2000] time 2.510 (2.472) data 0.000 (0.001) loss 1.0646 (1.2559) lr 1.9980e-03 eta 2 days, 11:41:22
epoch [7/50] batch [1080/2000] time 2.501 (2.472) data 0.000 (0.001) loss 2.3773 (1.2605) lr 1.9980e-03 eta 2 days, 11:40:48
epoch [7/50] batch [1100/2000] time 2.380 (2.472) data 0.000 (0.001) loss 1.7875 (1.2606) lr 1.9980e-03 eta 2 days, 11:40:13
epoch [7/50] batch [1120/2000] time 2.509 (2.472) data 0.000 (0.001) loss 0.2061 (1.2625) lr 1.9980e-03 eta 2 days, 11:39:25
epoch [7/50] batch [1140/2000] time 2.464 (2.472) data 0.001 (0.001) loss 0.8788 (1.2598) lr 1.9980e-03 eta 2 days, 11:38:47
epoch [7/50] batch [1160/2000] time 2.441 (2.472) data 0.000 (0.001) loss 0.3984 (1.2632) lr 1.9980e-03 eta 2 days, 11:37:52
epoch [7/50] batch [1180/2000] time 2.461 (2.472) data 0.000 (0.001) loss 0.1617 (1.2685) lr 1.9980e-03 eta 2 days, 11:37:02
epoch [7/50] batch [1200/2000] time 2.567 (2.472) data 0.000 (0.001) loss 0.4420 (1.2648) lr 1.9980e-03 eta 2 days, 11:36:31
epoch [7/50] batch [1220/2000] time 2.475 (2.476) data 0.000 (0.001) loss 1.0504 (1.2609) lr 1.9980e-03 eta 2 days, 11:41:22
epoch [7/50] batch [1240/2000] time 3.999 (2.485) data 0.004 (0.001) loss 0.7229 (1.2606) lr 1.9980e-03 eta 2 days, 11:52:40
epoch [7/50] batch [1260/2000] time 3.726 (2.501) data 0.000 (0.001) loss 0.0752 (1.2601) lr 1.9980e-03 eta 2 days, 12:15:10
epoch [7/50] batch [1280/2000] time 4.005 (2.517) data 0.000 (0.001) loss 0.1413 (1.2645) lr 1.9980e-03 eta 2 days, 12:37:38
epoch [7/50] batch [1300/2000] time 2.553 (2.529) data 0.000 (0.001) loss 0.7012 (1.2628) lr 1.9980e-03 eta 2 days, 12:55:06
epoch [7/50] batch [1320/2000] time 2.586 (2.531) data 0.004 (0.001) loss 2.1583 (1.2634) lr 1.9980e-03 eta 2 days, 12:56:04
epoch [7/50] batch [1340/2000] time 4.920 (2.557) data 0.001 (0.001) loss 1.9157 (1.2571) lr 1.9980e-03 eta 2 days, 13:33:35
epoch [7/50] batch [1360/2000] time 5.714 (2.594) data 0.001 (0.001) loss 0.2635 (1.2616) lr 1.9980e-03 eta 2 days, 14:25:26
epoch [7/50] batch [1380/2000] time 5.916 (2.640) data 0.000 (0.001) loss 0.8212 (1.2629) lr 1.9980e-03 eta 2 days, 15:30:39
epoch [7/50] batch [1400/2000] time 4.782 (2.681) data 0.000 (0.001) loss 2.7506 (1.2607) lr 1.9980e-03 eta 2 days, 16:30:12
epoch [7/50] batch [1420/2000] time 4.532 (2.709) data 0.000 (0.001) loss 2.1898 (1.2595) lr 1.9980e-03 eta 2 days, 17:08:34
epoch [7/50] batch [1440/2000] time 5.619 (2.745) data 0.000 (0.001) loss 0.4270 (1.2574) lr 1.9980e-03 eta 2 days, 18:00:50
epoch [7/50] batch [1460/2000] time 4.566 (2.777) data 0.000 (0.001) loss 3.1678 (1.2613) lr 1.9980e-03 eta 2 days, 18:45:20
epoch [7/50] batch [1480/2000] time 5.576 (2.815) data 0.001 (0.001) loss 4.4337 (1.2680) lr 1.9980e-03 eta 2 days, 19:39:02
epoch [7/50] batch [1500/2000] time 6.016 (2.855) data 0.001 (0.001) loss 1.0482 (1.2652) lr 1.9980e-03 eta 2 days, 20:35:53
epoch [7/50] batch [1520/2000] time 4.543 (2.887) data 0.000 (0.001) loss 0.5258 (1.2735) lr 1.9980e-03 eta 2 days, 21:21:46
epoch [7/50] batch [1540/2000] time 4.626 (2.915) data 0.000 (0.001) loss 0.4584 (1.2782) lr 1.9980e-03 eta 2 days, 22:00:50
epoch [7/50] batch [1560/2000] time 6.034 (2.946) data 0.000 (0.001) loss 0.4567 (1.2787) lr 1.9980e-03 eta 2 days, 22:44:29
epoch [7/50] batch [1580/2000] time 5.676 (2.983) data 0.000 (0.001) loss 0.0944 (1.2821) lr 1.9980e-03 eta 2 days, 23:36:17
epoch [7/50] batch [1600/2000] time 5.594 (3.013) data 0.000 (0.001) loss 1.7305 (1.2820) lr 1.9980e-03 eta 3 days, 0:18:53
epoch [7/50] batch [1620/2000] time 6.141 (3.043) data 0.001 (0.001) loss 0.1324 (1.2791) lr 1.9980e-03 eta 3 days, 1:01:12
epoch [7/50] batch [1640/2000] time 6.068 (3.076) data 0.000 (0.001) loss 0.1642 (1.2775) lr 1.9980e-03 eta 3 days, 1:47:44
epoch [7/50] batch [1660/2000] time 6.015 (3.109) data 0.001 (0.001) loss 1.1121 (1.2795) lr 1.9980e-03 eta 3 days, 2:34:19
epoch [7/50] batch [1680/2000] time 4.742 (3.134) data 0.001 (0.001) loss 0.9623 (1.2785) lr 1.9980e-03 eta 3 days, 3:08:14
epoch [7/50] batch [1700/2000] time 4.564 (3.151) data 0.000 (0.001) loss 0.5653 (1.2809) lr 1.9980e-03 eta 3 days, 3:31:33
epoch [7/50] batch [1720/2000] time 5.972 (3.182) data 0.000 (0.001) loss 1.5599 (1.2764) lr 1.9980e-03 eta 3 days, 4:15:03
epoch [7/50] batch [1740/2000] time 4.517 (3.211) data 0.001 (0.001) loss 0.0788 (1.2784) lr 1.9980e-03 eta 3 days, 4:55:48
epoch [7/50] batch [1760/2000] time 4.654 (3.229) data 0.000 (0.001) loss 1.0213 (1.2804) lr 1.9980e-03 eta 3 days, 5:21:01
epoch [7/50] batch [1780/2000] time 6.022 (3.249) data 0.000 (0.001) loss 0.8426 (1.2836) lr 1.9980e-03 eta 3 days, 5:48:15
epoch [7/50] batch [1800/2000] time 6.034 (3.276) data 0.000 (0.001) loss 1.1337 (1.2831) lr 1.9980e-03 eta 3 days, 6:26:47
epoch [7/50] batch [1820/2000] time 4.575 (3.295) data 0.001 (0.001) loss 2.4542 (1.2839) lr 1.9980e-03 eta 3 days, 6:52:31
epoch [7/50] batch [1840/2000] time 5.712 (3.313) data 0.000 (0.001) loss 0.7068 (1.2842) lr 1.9980e-03 eta 3 days, 7:17:18
epoch [7/50] batch [1860/2000] time 4.530 (3.335) data 0.000 (0.001) loss 1.8036 (1.2886) lr 1.9980e-03 eta 3 days, 7:47:19
epoch [7/50] batch [1880/2000] time 6.072 (3.355) data 0.000 (0.001) loss 2.9840 (1.2878) lr 1.9980e-03 eta 3 days, 8:15:03
epoch [7/50] batch [1900/2000] time 6.025 (3.381) data 0.001 (0.001) loss 0.1925 (1.2863) lr 1.9980e-03 eta 3 days, 8:51:05
epoch [7/50] batch [1920/2000] time 4.671 (3.400) data 0.000 (0.001) loss 2.2877 (1.2880) lr 1.9980e-03 eta 3 days, 9:18:31
epoch [7/50] batch [1940/2000] time 4.588 (3.418) data 0.000 (0.001) loss 2.5199 (1.2884) lr 1.9980e-03 eta 3 days, 9:41:55
epoch [7/50] batch [1960/2000] time 4.581 (3.431) data 0.000 (0.001) loss 0.4825 (1.2900) lr 1.9980e-03 eta 3 days, 10:00:11
epoch [7/50] batch [1980/2000] time 4.801 (3.445) data 0.000 (0.001) loss 0.5648 (1.2886) lr 1.9980e-03 eta 3 days, 10:18:47
epoch [7/50] batch [2000/2000] time 4.573 (3.459) data 0.000 (0.001) loss 0.6297 (1.2911) lr 1.9921e-03 eta 3 days, 10:37:39
epoch [8/50] batch [20/2000] time 6.034 (5.533) data 0.000 (0.033) loss 1.6349 (1.0734) lr 1.9921e-03 eta 5 days, 12:09:23
epoch [8/50] batch [40/2000] time 5.958 (5.635) data 0.000 (0.017) loss 2.5320 (1.2560) lr 1.9921e-03 eta 5 days, 14:32:53
epoch [8/50] batch [60/2000] time 6.131 (5.662) data 0.001 (0.011) loss 0.2651 (1.2255) lr 1.9921e-03 eta 5 days, 15:10:00
epoch [8/50] batch [80/2000] time 4.542 (5.475) data 0.000 (0.009) loss 1.5145 (1.2562) lr 1.9921e-03 eta 5 days, 10:39:46
epoch [8/50] batch [100/2000] time 5.590 (5.386) data 0.000 (0.007) loss 0.3294 (1.2504) lr 1.9921e-03 eta 5 days, 8:31:09
epoch [8/50] batch [120/2000] time 4.683 (5.352) data 0.000 (0.006) loss 4.3640 (1.3130) lr 1.9921e-03 eta 5 days, 7:39:52
epoch [8/50] batch [140/2000] time 5.983 (5.365) data 0.000 (0.005) loss 1.2265 (1.3276) lr 1.9921e-03 eta 5 days, 7:57:34
epoch [8/50] batch [160/2000] time 6.003 (5.427) data 0.000 (0.005) loss 0.3369 (1.3323) lr 1.9921e-03 eta 5 days, 9:23:45
epoch [8/50] batch [180/2000] time 5.994 (5.473) data 0.000 (0.004) loss 0.0690 (1.3263) lr 1.9921e-03 eta 5 days, 10:28:20
epoch [8/50] batch [200/2000] time 5.705 (5.510) data 0.000 (0.004) loss 0.8355 (1.3200) lr 1.9921e-03 eta 5 days, 11:19:16
epoch [8/50] batch [220/2000] time 5.068 (5.441) data 0.000 (0.004) loss 0.5669 (1.3069) lr 1.9921e-03 eta 5 days, 9:38:13
epoch [8/50] batch [240/2000] time 4.424 (5.406) data 0.000 (0.003) loss 0.3899 (1.3214) lr 1.9921e-03 eta 5 days, 8:46:17
epoch [8/50] batch [260/2000] time 5.761 (5.392) data 0.000 (0.003) loss 0.8799 (1.3216) lr 1.9921e-03 eta 5 days, 8:25:01
epoch [8/50] batch [280/2000] time 5.742 (5.408) data 0.000 (0.003) loss 0.1087 (1.3219) lr 1.9921e-03 eta 5 days, 8:45:31
epoch [8/50] batch [300/2000] time 4.288 (5.396) data 0.000 (0.003) loss 0.1730 (1.2878) lr 1.9921e-03 eta 5 days, 8:27:34
epoch [8/50] batch [320/2000] time 5.257 (5.391) data 0.000 (0.003) loss 2.9485 (1.3129) lr 1.9921e-03 eta 5 days, 8:18:43
epoch [8/50] batch [340/2000] time 5.750 (5.400) data 0.000 (0.003) loss 0.2256 (1.3018) lr 1.9921e-03 eta 5 days, 8:29:34
epoch [8/50] batch [360/2000] time 5.832 (5.404) data 0.000 (0.002) loss 1.5189 (1.2924) lr 1.9921e-03 eta 5 days, 8:33:58
epoch [8/50] batch [380/2000] time 5.779 (5.411) data 0.001 (0.002) loss 0.4183 (1.2896) lr 1.9921e-03 eta 5 days, 8:42:02
epoch [8/50] batch [400/2000] time 4.460 (5.378) data 0.001 (0.002) loss 0.9243 (1.2777) lr 1.9921e-03 eta 5 days, 7:53:12
epoch [8/50] batch [420/2000] time 6.212 (5.412) data 0.000 (0.002) loss 3.4787 (1.2865) lr 1.9921e-03 eta 5 days, 8:40:01
epoch [8/50] batch [440/2000] time 6.170 (5.436) data 0.000 (0.002) loss 0.0231 (1.2815) lr 1.9921e-03 eta 5 days, 9:11:48
epoch [8/50] batch [460/2000] time 4.816 (5.463) data 0.000 (0.002) loss 1.3402 (1.2712) lr 1.9921e-03 eta 5 days, 9:48:11
epoch [8/50] batch [480/2000] time 6.150 (5.492) data 0.000 (0.002) loss 0.3815 (1.2851) lr 1.9921e-03 eta 5 days, 10:27:32
epoch [8/50] batch [500/2000] time 6.213 (5.515) data 0.000 (0.002) loss 2.1313 (1.2781) lr 1.9921e-03 eta 5 days, 10:58:52
epoch [8/50] batch [520/2000] time 6.204 (5.530) data 0.005 (0.002) loss 1.0278 (1.2817) lr 1.9921e-03 eta 5 days, 11:19:06
epoch [8/50] batch [540/2000] time 6.199 (5.554) data 0.001 (0.002) loss 0.6657 (1.2802) lr 1.9921e-03 eta 5 days, 11:50:56
epoch [8/50] batch [560/2000] time 6.112 (5.571) data 0.000 (0.002) loss 0.3383 (1.2782) lr 1.9921e-03 eta 5 days, 12:13:26
epoch [8/50] batch [580/2000] time 6.213 (5.588) data 0.000 (0.002) loss 0.1570 (1.2880) lr 1.9921e-03 eta 5 days, 12:35:30
epoch [8/50] batch [600/2000] time 6.198 (5.608) data 0.001 (0.002) loss 1.4998 (1.2818) lr 1.9921e-03 eta 5 days, 13:01:37
epoch [8/50] batch [620/2000] time 6.169 (5.623) data 0.000 (0.002) loss 0.1447 (1.2720) lr 1.9921e-03 eta 5 days, 13:20:54
epoch [8/50] batch [640/2000] time 6.211 (5.636) data 0.000 (0.002) loss 0.2179 (1.2827) lr 1.9921e-03 eta 5 days, 13:38:44
epoch [8/50] batch [660/2000] time 6.354 (5.653) data 0.000 (0.002) loss 2.1573 (1.2821) lr 1.9921e-03 eta 5 days, 14:00:32
epoch [8/50] batch [680/2000] time 6.176 (5.666) data 0.000 (0.002) loss 0.3861 (1.2826) lr 1.9921e-03 eta 5 days, 14:16:32
epoch [8/50] batch [700/2000] time 6.237 (5.678) data 0.000 (0.002) loss 1.3420 (1.2821) lr 1.9921e-03 eta 5 days, 14:31:33
epoch [8/50] batch [720/2000] time 6.115 (5.691) data 0.000 (0.002) loss 0.1735 (1.2698) lr 1.9921e-03 eta 5 days, 14:49:16
epoch [8/50] batch [740/2000] time 6.197 (5.702) data 0.000 (0.002) loss 0.1404 (1.2707) lr 1.9921e-03 eta 5 days, 15:02:38
epoch [8/50] batch [760/2000] time 6.202 (5.712) data 0.000 (0.002) loss 1.3592 (1.2687) lr 1.9921e-03 eta 5 days, 15:14:14
epoch [8/50] batch [780/2000] time 6.200 (5.721) data 0.000 (0.001) loss 1.3055 (1.2647) lr 1.9921e-03 eta 5 days, 15:25:31
epoch [8/50] batch [800/2000] time 6.173 (5.732) data 0.000 (0.001) loss 0.2706 (1.2698) lr 1.9921e-03 eta 5 days, 15:39:41
epoch [8/50] batch [820/2000] time 6.198 (5.740) data 0.000 (0.001) loss 2.2933 (1.2664) lr 1.9921e-03 eta 5 days, 15:48:24
epoch [8/50] batch [840/2000] time 4.651 (5.741) data 0.000 (0.001) loss 0.1969 (1.2651) lr 1.9921e-03 eta 5 days, 15:47:52
epoch [8/50] batch [860/2000] time 4.306 (5.715) data 0.000 (0.001) loss 0.7509 (1.2711) lr 1.9921e-03 eta 5 days, 15:09:03
epoch [8/50] batch [880/2000] time 5.710 (5.693) data 0.000 (0.001) loss 1.9041 (1.2725) lr 1.9921e-03 eta 5 days, 14:36:14
epoch [8/50] batch [900/2000] time 5.965 (5.697) data 0.000 (0.001) loss 0.4576 (1.2690) lr 1.9921e-03 eta 5 days, 14:39:40
epoch [8/50] batch [920/2000] time 6.014 (5.700) data 0.000 (0.001) loss 3.0160 (1.2584) lr 1.9921e-03 eta 5 days, 14:42:55
epoch [8/50] batch [940/2000] time 5.977 (5.704) data 0.000 (0.001) loss 1.0473 (1.2624) lr 1.9921e-03 eta 5 days, 14:46:16
epoch [8/50] batch [960/2000] time 6.148 (5.707) data 0.000 (0.001) loss 3.8021 (1.2657) lr 1.9921e-03 eta 5 days, 14:48:58
epoch [8/50] batch [980/2000] time 5.958 (5.709) data 0.000 (0.001) loss 0.4385 (1.2655) lr 1.9921e-03 eta 5 days, 14:50:06
epoch [8/50] batch [1000/2000] time 5.899 (5.713) data 0.000 (0.001) loss 1.9323 (1.2692) lr 1.9921e-03 eta 5 days, 14:52:43
epoch [8/50] batch [1020/2000] time 5.767 (5.715) data 0.000 (0.001) loss 1.9906 (1.2713) lr 1.9921e-03 eta 5 days, 14:54:09
epoch [8/50] batch [1040/2000] time 4.906 (5.716) data 0.000 (0.001) loss 2.6131 (1.2698) lr 1.9921e-03 eta 5 days, 14:54:27
epoch [8/50] batch [1060/2000] time 5.985 (5.719) data 0.000 (0.001) loss 1.1281 (1.2733) lr 1.9921e-03 eta 5 days, 14:56:00
epoch [8/50] batch [1080/2000] time 4.340 (5.709) data 0.000 (0.001) loss 0.2922 (1.2783) lr 1.9921e-03 eta 5 days, 14:39:26
epoch [8/50] batch [1100/2000] time 5.276 (5.702) data 0.000 (0.001) loss 0.9115 (1.2840) lr 1.9921e-03 eta 5 days, 14:28:24
epoch [8/50] batch [1120/2000] time 5.779 (5.700) data 0.000 (0.001) loss 2.1383 (1.2854) lr 1.9921e-03 eta 5 days, 14:23:48
epoch [8/50] batch [1140/2000] time 4.338 (5.679) data 0.001 (0.001) loss 2.3727 (1.2915) lr 1.9921e-03 eta 5 days, 13:52:19
epoch [8/50] batch [1160/2000] time 4.300 (5.656) data 0.000 (0.001) loss 2.5066 (1.2957) lr 1.9921e-03 eta 5 days, 13:17:08
epoch [8/50] batch [1180/2000] time 4.310 (5.633) data 0.001 (0.001) loss 0.1032 (1.2894) lr 1.9921e-03 eta 5 days, 12:43:00
epoch [8/50] batch [1200/2000] time 4.290 (5.611) data 0.000 (0.001) loss 1.4054 (1.2888) lr 1.9921e-03 eta 5 days, 12:09:55
epoch [8/50] batch [1220/2000] time 4.251 (5.589) data 0.000 (0.001) loss 0.7300 (1.2834) lr 1.9921e-03 eta 5 days, 11:37:54
epoch [8/50] batch [1240/2000] time 4.294 (5.569) data 0.000 (0.001) loss 0.6704 (1.2813) lr 1.9921e-03 eta 5 days, 11:06:55
epoch [8/50] batch [1260/2000] time 4.417 (5.549) data 0.000 (0.001) loss 0.1805 (1.2842) lr 1.9921e-03 eta 5 days, 10:36:20
epoch [8/50] batch [1280/2000] time 4.319 (5.529) data 0.000 (0.001) loss 2.1353 (1.2863) lr 1.9921e-03 eta 5 days, 10:06:20
epoch [8/50] batch [1300/2000] time 4.321 (5.510) data 0.000 (0.001) loss 1.8675 (1.2862) lr 1.9921e-03 eta 5 days, 9:37:47
epoch [8/50] batch [1320/2000] time 4.275 (5.491) data 0.000 (0.001) loss 1.2749 (1.2867) lr 1.9921e-03 eta 5 days, 9:10:10
epoch [8/50] batch [1340/2000] time 4.262 (5.474) data 0.000 (0.001) loss 1.3107 (1.2874) lr 1.9921e-03 eta 5 days, 8:43:08
epoch [8/50] batch [1360/2000] time 4.308 (5.457) data 0.000 (0.001) loss 0.5772 (1.2851) lr 1.9921e-03 eta 5 days, 8:17:37
epoch [8/50] batch [1380/2000] time 4.347 (5.440) data 0.000 (0.001) loss 1.6222 (1.2890) lr 1.9921e-03 eta 5 days, 7:52:15
epoch [8/50] batch [1400/2000] time 3.724 (5.423) data 0.001 (0.001) loss 0.4332 (1.2887) lr 1.9921e-03 eta 5 days, 7:26:19
epoch [8/50] batch [1420/2000] time 4.312 (5.406) data 0.000 (0.001) loss 0.5816 (1.2847) lr 1.9921e-03 eta 5 days, 7:01:19
epoch [8/50] batch [1440/2000] time 4.339 (5.391) data 0.000 (0.001) loss 0.7943 (1.2890) lr 1.9921e-03 eta 5 days, 6:38:11
epoch [8/50] batch [1460/2000] time 4.326 (5.376) data 0.000 (0.001) loss 0.6404 (1.2820) lr 1.9921e-03 eta 5 days, 6:15:26
epoch [8/50] batch [1480/2000] time 4.315 (5.362) data 0.000 (0.001) loss 2.8335 (1.2866) lr 1.9921e-03 eta 5 days, 5:53:13
epoch [8/50] batch [1500/2000] time 4.334 (5.348) data 0.000 (0.001) loss 2.2246 (1.2898) lr 1.9921e-03 eta 5 days, 5:31:22
epoch [8/50] batch [1520/2000] time 4.338 (5.334) data 0.000 (0.001) loss 0.5018 (1.2896) lr 1.9921e-03 eta 5 days, 5:10:13
epoch [8/50] batch [1540/2000] time 4.330 (5.321) data 0.000 (0.001) loss 0.6987 (1.2931) lr 1.9921e-03 eta 5 days, 4:49:39
epoch [8/50] batch [1560/2000] time 4.320 (5.307) data 0.000 (0.001) loss 0.4171 (1.2945) lr 1.9921e-03 eta 5 days, 4:28:35
epoch [8/50] batch [1580/2000] time 4.300 (5.294) data 0.000 (0.001) loss 1.9003 (1.2951) lr 1.9921e-03 eta 5 days, 4:09:11
epoch [8/50] batch [1600/2000] time 4.340 (5.282) data 0.000 (0.001) loss 0.4772 (1.2906) lr 1.9921e-03 eta 5 days, 3:50:01
epoch [8/50] batch [1620/2000] time 4.305 (5.270) data 0.000 (0.001) loss 0.2994 (1.2898) lr 1.9921e-03 eta 5 days, 3:31:21
epoch [8/50] batch [1640/2000] time 4.291 (5.258) data 0.000 (0.001) loss 1.4644 (1.2902) lr 1.9921e-03 eta 5 days, 3:13:16
epoch [8/50] batch [1660/2000] time 4.320 (5.247) data 0.000 (0.001) loss 1.6714 (1.2945) lr 1.9921e-03 eta 5 days, 2:55:19
epoch [8/50] batch [1680/2000] time 4.244 (5.236) data 0.001 (0.001) loss 1.1790 (1.2950) lr 1.9921e-03 eta 5 days, 2:37:45
epoch [8/50] batch [1700/2000] time 4.455 (5.224) data 0.001 (0.001) loss 0.8576 (1.2949) lr 1.9921e-03 eta 5 days, 2:19:53
epoch [8/50] batch [1720/2000] time 4.289 (5.213) data 0.000 (0.001) loss 0.8614 (1.2933) lr 1.9921e-03 eta 5 days, 2:03:08
epoch [8/50] batch [1740/2000] time 4.271 (5.203) data 0.000 (0.001) loss 1.6614 (1.2892) lr 1.9921e-03 eta 5 days, 1:46:51
epoch [8/50] batch [1760/2000] time 4.324 (5.193) data 0.000 (0.001) loss 0.1932 (1.2873) lr 1.9921e-03 eta 5 days, 1:30:47
epoch [8/50] batch [1780/2000] time 4.281 (5.183) data 0.000 (0.001) loss 2.3960 (1.2883) lr 1.9921e-03 eta 5 days, 1:15:02
epoch [8/50] batch [1800/2000] time 4.315 (5.173) data 0.001 (0.001) loss 1.3562 (1.2919) lr 1.9921e-03 eta 5 days, 0:59:31
epoch [8/50] batch [1820/2000] time 4.308 (5.163) data 0.000 (0.001) loss 2.2770 (1.2937) lr 1.9921e-03 eta 5 days, 0:44:15
epoch [8/50] batch [1840/2000] time 4.258 (5.154) data 0.000 (0.001) loss 0.0919 (1.2918) lr 1.9921e-03 eta 5 days, 0:29:22
epoch [8/50] batch [1860/2000] time 4.417 (5.144) data 0.000 (0.001) loss 0.5750 (1.2920) lr 1.9921e-03 eta 5 days, 0:13:14
epoch [8/50] batch [1880/2000] time 2.545 (5.117) data 0.000 (0.001) loss 1.0323 (1.2916) lr 1.9921e-03 eta 4 days, 23:34:23
epoch [8/50] batch [1900/2000] time 2.861 (5.091) data 0.000 (0.001) loss 0.7713 (1.2903) lr 1.9921e-03 eta 4 days, 22:56:26
epoch [8/50] batch [1920/2000] time 2.082 (5.067) data 0.000 (0.001) loss 0.5082 (1.2855) lr 1.9921e-03 eta 4 days, 22:20:25
epoch [8/50] batch [1940/2000] time 2.117 (5.043) data 0.000 (0.001) loss 2.5729 (1.2883) lr 1.9921e-03 eta 4 days, 21:44:46
epoch [8/50] batch [1960/2000] time 3.378 (5.022) data 0.000 (0.001) loss 2.5499 (1.2867) lr 1.9921e-03 eta 4 days, 21:13:30
epoch [8/50] batch [1980/2000] time 2.421 (4.996) data 0.000 (0.001) loss 1.4212 (1.2883) lr 1.9921e-03 eta 4 days, 20:36:18
epoch [8/50] batch [2000/2000] time 3.604 (4.975) data 0.000 (0.001) loss 0.4251 (1.2881) lr 1.9823e-03 eta 4 days, 20:05:14
epoch [9/50] batch [20/2000] time 3.641 (3.563) data 0.000 (0.031) loss 1.7233 (0.9422) lr 1.9823e-03 eta 3 days, 11:06:35
epoch [9/50] batch [40/2000] time 3.852 (3.521) data 0.006 (0.016) loss 1.0151 (1.1511) lr 1.9823e-03 eta 3 days, 10:07:34
epoch [9/50] batch [60/2000] time 4.338 (3.506) data 0.001 (0.011) loss 1.8496 (1.2582) lr 1.9823e-03 eta 3 days, 9:44:15
epoch [9/50] batch [80/2000] time 2.562 (3.253) data 0.000 (0.009) loss 0.3744 (1.2059) lr 1.9823e-03 eta 3 days, 3:50:30
epoch [9/50] batch [100/2000] time 3.157 (3.126) data 0.000 (0.007) loss 1.2119 (1.1811) lr 1.9823e-03 eta 3 days, 0:51:17
epoch [9/50] batch [120/2000] time 2.399 (3.024) data 0.000 (0.006) loss 0.3124 (1.2065) lr 1.9823e-03 eta 2 days, 22:27:35
epoch [9/50] batch [140/2000] time 4.322 (3.017) data 0.000 (0.005) loss 1.5188 (1.2028) lr 1.9823e-03 eta 2 days, 22:17:16
epoch [9/50] batch [160/2000] time 2.884 (3.072) data 0.000 (0.005) loss 1.3551 (1.2797) lr 1.9823e-03 eta 2 days, 23:32:21
epoch [9/50] batch [180/2000] time 2.206 (3.027) data 0.000 (0.004) loss 0.4250 (1.2819) lr 1.9823e-03 eta 2 days, 22:28:25
epoch [9/50] batch [200/2000] time 3.674 (3.000) data 0.000 (0.004) loss 2.0572 (1.2769) lr 1.9823e-03 eta 2 days, 21:50:28
epoch [9/50] batch [220/2000] time 4.252 (3.022) data 0.000 (0.003) loss 2.9716 (1.2611) lr 1.9823e-03 eta 2 days, 22:19:05
epoch [9/50] batch [240/2000] time 4.610 (3.074) data 0.000 (0.003) loss 0.6128 (1.2539) lr 1.9823e-03 eta 2 days, 23:31:19
epoch [9/50] batch [260/2000] time 3.575 (3.122) data 0.002 (0.003) loss 0.2120 (1.2619) lr 1.9823e-03 eta 3 days, 0:37:11
epoch [9/50] batch [280/2000] time 2.012 (3.136) data 0.000 (0.003) loss 2.9951 (1.2507) lr 1.9823e-03 eta 3 days, 0:55:34
epoch [9/50] batch [300/2000] time 4.245 (3.109) data 0.000 (0.003) loss 1.7574 (1.2429) lr 1.9823e-03 eta 3 days, 0:16:28
epoch [9/50] batch [320/2000] time 4.773 (3.208) data 0.000 (0.003) loss 1.2335 (1.2603) lr 1.9823e-03 eta 3 days, 2:34:06
epoch [9/50] batch [340/2000] time 4.072 (3.257) data 0.000 (0.002) loss 0.5012 (1.2742) lr 1.9823e-03 eta 3 days, 3:41:56
epoch [9/50] batch [360/2000] time 4.761 (3.300) data 0.000 (0.002) loss 0.4665 (1.2743) lr 1.9823e-03 eta 3 days, 4:40:39
epoch [9/50] batch [380/2000] time 4.243 (3.353) data 0.000 (0.002) loss 2.6696 (1.2633) lr 1.9823e-03 eta 3 days, 5:52:34
epoch [9/50] batch [400/2000] time 4.956 (3.390) data 0.000 (0.002) loss 1.9236 (1.2587) lr 1.9823e-03 eta 3 days, 6:43:13
epoch [9/50] batch [420/2000] time 4.008 (3.421) data 0.000 (0.002) loss 0.5761 (1.2513) lr 1.9823e-03 eta 3 days, 7:24:52
epoch [9/50] batch [440/2000] time 3.910 (3.457) data 0.000 (0.002) loss 1.8220 (1.2508) lr 1.9823e-03 eta 3 days, 8:14:18
epoch [9/50] batch [460/2000] time 6.229 (3.491) data 0.000 (0.002) loss 0.0399 (1.2496) lr 1.9823e-03 eta 3 days, 9:00:32
epoch [9/50] batch [480/2000] time 2.294 (3.530) data 0.000 (0.002) loss 0.0339 (1.2459) lr 1.9823e-03 eta 3 days, 9:54:02
epoch [9/50] batch [500/2000] time 4.058 (3.590) data 0.000 (0.002) loss 0.5193 (1.2417) lr 1.9823e-03 eta 3 days, 11:16:01
epoch [9/50] batch [520/2000] time 6.344 (3.636) data 0.000 (0.002) loss 2.6635 (1.2542) lr 1.9823e-03 eta 3 days, 12:19:25
epoch [9/50] batch [540/2000] time 2.780 (3.686) data 0.000 (0.002) loss 2.1000 (1.2578) lr 1.9823e-03 eta 3 days, 13:26:57
epoch [9/50] batch [560/2000] time 5.570 (3.774) data 0.006 (0.002) loss 5.0866 (1.2596) lr 1.9823e-03 eta 3 days, 15:28:54
epoch [9/50] batch [580/2000] time 7.783 (3.858) data 0.001 (0.002) loss 1.1339 (1.2605) lr 1.9823e-03 eta 3 days, 17:23:24
epoch [9/50] batch [600/2000] time 4.210 (3.910) data 0.010 (0.002) loss 0.8008 (1.2487) lr 1.9823e-03 eta 3 days, 18:34:28
epoch [9/50] batch [620/2000] time 8.367 (4.022) data 0.001 (0.002) loss 0.4246 (1.2401) lr 1.9823e-03 eta 3 days, 21:08:44
epoch [9/50] batch [640/2000] time 5.011 (4.088) data 0.000 (0.002) loss 0.8907 (1.2273) lr 1.9823e-03 eta 3 days, 22:38:59
epoch [9/50] batch [660/2000] time 5.617 (4.113) data 0.000 (0.002) loss 2.0657 (1.2267) lr 1.9823e-03 eta 3 days, 23:12:43
epoch [9/50] batch [680/2000] time 8.069 (4.156) data 0.000 (0.002) loss 0.4136 (1.2244) lr 1.9823e-03 eta 4 days, 0:11:59
epoch [9/50] batch [700/2000] time 7.726 (4.240) data 0.000 (0.002) loss 0.7865 (1.2389) lr 1.9823e-03 eta 4 days, 2:05:50
epoch [9/50] batch [720/2000] time 5.282 (4.310) data 0.000 (0.002) loss 1.8495 (1.2381) lr 1.9823e-03 eta 4 days, 3:42:01
epoch [9/50] batch [740/2000] time 6.162 (4.372) data 0.000 (0.002) loss 0.6944 (1.2378) lr 1.9823e-03 eta 4 days, 5:06:57
epoch [9/50] batch [760/2000] time 7.752 (4.439) data 0.000 (0.002) loss 0.7774 (1.2381) lr 1.9823e-03 eta 4 days, 6:37:48
epoch [9/50] batch [780/2000] time 3.937 (4.455) data 0.001 (0.002) loss 0.0103 (1.2324) lr 1.9823e-03 eta 4 days, 6:59:15
epoch [9/50] batch [800/2000] time 4.035 (4.460) data 0.000 (0.002) loss 1.6617 (1.2309) lr 1.9823e-03 eta 4 days, 7:05:07
epoch [9/50] batch [820/2000] time 3.859 (4.466) data 0.000 (0.002) loss 0.9434 (1.2303) lr 1.9823e-03 eta 4 days, 7:10:45
epoch [9/50] batch [840/2000] time 3.928 (4.472) data 0.001 (0.002) loss 0.1207 (1.2262) lr 1.9823e-03 eta 4 days, 7:18:37
epoch [9/50] batch [860/2000] time 3.951 (4.480) data 0.000 (0.002) loss 0.8155 (1.2283) lr 1.9823e-03 eta 4 days, 7:28:11
epoch [9/50] batch [880/2000] time 5.684 (4.457) data 0.003 (0.002) loss 2.8081 (1.2388) lr 1.9823e-03 eta 4 days, 6:55:04
epoch [9/50] batch [900/2000] time 2.364 (4.427) data 0.002 (0.002) loss 1.1800 (1.2400) lr 1.9823e-03 eta 4 days, 6:11:13
epoch [9/50] batch [920/2000] time 3.705 (4.430) data 0.001 (0.002) loss 0.6492 (1.2340) lr 1.9823e-03 eta 4 days, 6:14:10
epoch [9/50] batch [940/2000] time 4.028 (4.409) data 0.001 (0.002) loss 0.4725 (1.2325) lr 1.9823e-03 eta 4 days, 5:43:59
epoch [9/50] batch [960/2000] time 4.300 (4.372) data 0.001 (0.001) loss 0.5437 (1.2263) lr 1.9823e-03 eta 4 days, 4:50:31
epoch [9/50] batch [980/2000] time 2.454 (4.355) data 0.000 (0.001) loss 1.6686 (1.2287) lr 1.9823e-03 eta 4 days, 4:26:26
epoch [9/50] batch [1000/2000] time 3.628 (4.333) data 0.005 (0.001) loss 1.0252 (1.2339) lr 1.9823e-03 eta 4 days, 3:53:35
epoch [9/50] batch [1020/2000] time 4.079 (4.314) data 0.000 (0.001) loss 0.6557 (1.2288) lr 1.9823e-03 eta 4 days, 3:26:06
epoch [9/50] batch [1040/2000] time 3.828 (4.295) data 0.001 (0.001) loss 0.9042 (1.2363) lr 1.9823e-03 eta 4 days, 2:58:27
epoch [9/50] batch [1060/2000] time 3.232 (4.265) data 0.000 (0.001) loss 0.7079 (1.2346) lr 1.9823e-03 eta 4 days, 2:15:46
epoch [9/50] batch [1080/2000] time 4.636 (4.250) data 0.000 (0.001) loss 0.5617 (1.2391) lr 1.9823e-03 eta 4 days, 1:53:24
epoch [9/50] batch [1100/2000] time 4.453 (4.255) data 0.000 (0.001) loss 0.1886 (1.2406) lr 1.9823e-03 eta 4 days, 1:58:40
epoch [9/50] batch [1120/2000] time 4.300 (4.259) data 0.001 (0.001) loss 1.2567 (1.2365) lr 1.9823e-03 eta 4 days, 2:03:37
epoch [9/50] batch [1140/2000] time 4.228 (4.264) data 0.001 (0.001) loss 0.3949 (1.2398) lr 1.9823e-03 eta 4 days, 2:09:13
epoch [9/50] batch [1160/2000] time 4.198 (4.269) data 0.000 (0.001) loss 0.0773 (1.2407) lr 1.9823e-03 eta 4 days, 2:13:46
epoch [9/50] batch [1180/2000] time 4.321 (4.274) data 0.000 (0.001) loss 0.6277 (1.2393) lr 1.9823e-03 eta 4 days, 2:19:47
epoch [9/50] batch [1200/2000] time 5.659 (4.280) data 0.001 (0.001) loss 1.1095 (1.2392) lr 1.9823e-03 eta 4 days, 2:26:04
epoch [9/50] batch [1220/2000] time 4.535 (4.283) data 0.000 (0.001) loss 1.8899 (1.2420) lr 1.9823e-03 eta 4 days, 2:29:06
epoch [9/50] batch [1240/2000] time 4.347 (4.289) data 0.000 (0.001) loss 4.0954 (1.2425) lr 1.9823e-03 eta 4 days, 2:35:31
epoch [9/50] batch [1260/2000] time 4.272 (4.294) data 0.001 (0.001) loss 2.9344 (1.2422) lr 1.9823e-03 eta 4 days, 2:41:32
epoch [9/50] batch [1280/2000] time 4.280 (4.302) data 0.000 (0.001) loss 1.7311 (1.2380) lr 1.9823e-03 eta 4 days, 2:51:27
epoch [9/50] batch [1300/2000] time 6.501 (4.310) data 0.001 (0.001) loss 0.8336 (1.2452) lr 1.9823e-03 eta 4 days, 3:01:14
epoch [9/50] batch [1320/2000] time 4.643 (4.316) data 0.000 (0.001) loss 0.1174 (1.2459) lr 1.9823e-03 eta 4 days, 3:07:30
epoch [9/50] batch [1340/2000] time 5.069 (4.321) data 0.001 (0.001) loss 1.8572 (1.2475) lr 1.9823e-03 eta 4 days, 3:13:18
epoch [9/50] batch [1360/2000] time 2.963 (4.325) data 0.000 (0.001) loss 0.9150 (1.2462) lr 1.9823e-03 eta 4 days, 3:16:51
epoch [9/50] batch [1380/2000] time 5.003 (4.329) data 0.000 (0.001) loss 0.5834 (1.2496) lr 1.9823e-03 eta 4 days, 3:20:32
epoch [9/50] batch [1400/2000] time 5.241 (4.336) data 0.000 (0.001) loss 3.2882 (1.2501) lr 1.9823e-03 eta 4 days, 3:28:58
epoch [9/50] batch [1420/2000] time 4.506 (4.341) data 0.006 (0.001) loss 1.6714 (1.2536) lr 1.9823e-03 eta 4 days, 3:34:47
epoch [9/50] batch [1440/2000] time 4.654 (4.348) data 0.001 (0.001) loss 1.3976 (1.2574) lr 1.9823e-03 eta 4 days, 3:42:17
epoch [9/50] batch [1460/2000] time 5.067 (4.354) data 0.000 (0.001) loss 1.3057 (1.2573) lr 1.9823e-03 eta 4 days, 3:50:12
epoch [9/50] batch [1480/2000] time 5.201 (4.361) data 0.001 (0.001) loss 0.6811 (1.2578) lr 1.9823e-03 eta 4 days, 3:57:27
epoch [9/50] batch [1500/2000] time 4.228 (4.365) data 0.000 (0.001) loss 0.6381 (1.2572) lr 1.9823e-03 eta 4 days, 4:01:42
epoch [9/50] batch [1520/2000] time 4.148 (4.368) data 0.000 (0.001) loss 0.2287 (1.2611) lr 1.9823e-03 eta 4 days, 4:05:03
epoch [9/50] batch [1540/2000] time 4.121 (4.372) data 0.000 (0.001) loss 2.5252 (1.2622) lr 1.9823e-03 eta 4 days, 4:08:36
epoch [9/50] batch [1560/2000] time 4.420 (4.377) data 0.000 (0.001) loss 0.4546 (1.2604) lr 1.9823e-03 eta 4 days, 4:14:24
epoch [9/50] batch [1580/2000] time 4.397 (4.379) data 0.002 (0.001) loss 2.0926 (1.2609) lr 1.9823e-03 eta 4 days, 4:15:24
epoch [9/50] batch [1600/2000] time 4.313 (4.381) data 0.000 (0.001) loss 2.0211 (1.2584) lr 1.9823e-03 eta 4 days, 4:16:57
epoch [9/50] batch [1620/2000] time 5.771 (4.384) data 0.003 (0.001) loss 0.8068 (1.2600) lr 1.9823e-03 eta 4 days, 4:18:45
epoch [9/50] batch [1640/2000] time 4.362 (4.385) data 0.000 (0.001) loss 0.3392 (1.2581) lr 1.9823e-03 eta 4 days, 4:19:22
epoch [9/50] batch [1660/2000] time 4.393 (4.388) data 0.004 (0.001) loss 0.7442 (1.2601) lr 1.9823e-03 eta 4 days, 4:21:20
epoch [9/50] batch [1680/2000] time 4.311 (4.387) data 0.001 (0.001) loss 1.0142 (1.2608) lr 1.9823e-03 eta 4 days, 4:18:20
epoch [9/50] batch [1700/2000] time 4.298 (4.385) data 0.000 (0.001) loss 0.2234 (1.2621) lr 1.9823e-03 eta 4 days, 4:15:10
epoch [9/50] batch [1720/2000] time 4.240 (4.384) data 0.000 (0.001) loss 0.2580 (1.2592) lr 1.9823e-03 eta 4 days, 4:12:08
epoch [9/50] batch [1740/2000] time 4.306 (4.383) data 0.000 (0.001) loss 0.8337 (1.2592) lr 1.9823e-03 eta 4 days, 4:09:15
epoch [9/50] batch [1760/2000] time 4.330 (4.382) data 0.000 (0.001) loss 3.1146 (1.2573) lr 1.9823e-03 eta 4 days, 4:06:21
epoch [9/50] batch [1780/2000] time 4.315 (4.381) data 0.000 (0.001) loss 0.9015 (1.2577) lr 1.9823e-03 eta 4 days, 4:03:37
epoch [9/50] batch [1800/2000] time 4.332 (4.380) data 0.000 (0.001) loss 0.1639 (1.2547) lr 1.9823e-03 eta 4 days, 4:00:56
epoch [9/50] batch [1820/2000] time 4.370 (4.379) data 0.000 (0.001) loss 1.9337 (1.2553) lr 1.9823e-03 eta 4 days, 3:57:36
epoch [9/50] batch [1840/2000] time 4.335 (4.377) data 0.000 (0.001) loss 1.5316 (1.2581) lr 1.9823e-03 eta 4 days, 3:54:09
epoch [9/50] batch [1860/2000] time 4.295 (4.377) data 0.000 (0.001) loss 0.9612 (1.2565) lr 1.9823e-03 eta 4 days, 3:51:25
epoch [9/50] batch [1880/2000] time 4.265 (4.376) data 0.000 (0.001) loss 1.1696 (1.2605) lr 1.9823e-03 eta 4 days, 3:48:36
epoch [9/50] batch [1900/2000] time 4.290 (4.375) data 0.000 (0.001) loss 0.1013 (1.2596) lr 1.9823e-03 eta 4 days, 3:45:53
epoch [9/50] batch [1920/2000] time 4.265 (4.374) data 0.000 (0.001) loss 0.7352 (1.2619) lr 1.9823e-03 eta 4 days, 3:43:01
epoch [9/50] batch [1940/2000] time 4.292 (4.373) data 0.001 (0.001) loss 1.1664 (1.2618) lr 1.9823e-03 eta 4 days, 3:40:13
epoch [9/50] batch [1960/2000] time 4.183 (4.372) data 0.000 (0.001) loss 0.6527 (1.2597) lr 1.9823e-03 eta 4 days, 3:37:24
epoch [9/50] batch [1980/2000] time 4.292 (4.369) data 0.000 (0.001) loss 0.5633 (1.2586) lr 1.9823e-03 eta 4 days, 3:32:50
epoch [9/50] batch [2000/2000] time 4.241 (4.368) data 0.000 (0.001) loss 0.7312 (1.2612) lr 1.9686e-03 eta 4 days, 3:30:09
epoch [10/50] batch [20/2000] time 4.269 (4.330) data 0.000 (0.038) loss 0.8689 (1.2828) lr 1.9686e-03 eta 4 days, 2:36:04
epoch [10/50] batch [40/2000] time 4.236 (4.307) data 0.000 (0.019) loss 1.0715 (1.3980) lr 1.9686e-03 eta 4 days, 2:03:05
epoch [10/50] batch [60/2000] time 4.294 (4.303) data 0.001 (0.013) loss 1.8007 (1.3563) lr 1.9686e-03 eta 4 days, 1:56:58
epoch [10/50] batch [80/2000] time 4.268 (4.302) data 0.000 (0.010) loss 0.6824 (1.3545) lr 1.9686e-03 eta 4 days, 1:53:25
epoch [10/50] batch [100/2000] time 4.245 (4.299) data 0.000 (0.008) loss 0.2186 (1.3212) lr 1.9686e-03 eta 4 days, 1:47:40
epoch [10/50] batch [120/2000] time 4.253 (4.265) data 0.000 (0.007) loss 1.3652 (1.3111) lr 1.9686e-03 eta 4 days, 1:00:01
epoch [10/50] batch [140/2000] time 4.324 (4.267) data 0.000 (0.006) loss 1.5662 (1.3428) lr 1.9686e-03 eta 4 days, 1:01:18
epoch [10/50] batch [160/2000] time 4.286 (4.268) data 0.001 (0.005) loss 1.2904 (1.2984) lr 1.9686e-03 eta 4 days, 1:02:12
epoch [10/50] batch [180/2000] time 4.307 (4.270) data 0.000 (0.005) loss 0.1624 (1.2876) lr 1.9686e-03 eta 4 days, 1:02:13
epoch [10/50] batch [200/2000] time 4.319 (4.271) data 0.000 (0.004) loss 0.7647 (1.3162) lr 1.9686e-03 eta 4 days, 1:02:54
epoch [10/50] batch [220/2000] time 4.274 (4.271) data 0.002 (0.004) loss 2.5952 (1.3239) lr 1.9686e-03 eta 4 days, 1:01:58
epoch [10/50] batch [240/2000] time 4.312 (4.272) data 0.000 (0.004) loss 0.6895 (1.3117) lr 1.9686e-03 eta 4 days, 1:01:27
epoch [10/50] batch [260/2000] time 4.417 (4.266) data 0.000 (0.003) loss 0.6331 (1.2878) lr 1.9686e-03 eta 4 days, 0:51:21
epoch [10/50] batch [280/2000] time 4.262 (4.262) data 0.000 (0.003) loss 1.5586 (1.2827) lr 1.9686e-03 eta 4 days, 0:45:19
epoch [10/50] batch [300/2000] time 4.303 (4.264) data 0.000 (0.003) loss 0.8279 (1.2938) lr 1.9686e-03 eta 4 days, 0:46:12
epoch [10/50] batch [320/2000] time 4.309 (4.265) data 0.000 (0.003) loss 1.7534 (1.2910) lr 1.9686e-03 eta 4 days, 0:46:43
epoch [10/50] batch [340/2000] time 4.324 (4.267) data 0.000 (0.003) loss 0.0497 (1.2850) lr 1.9686e-03 eta 4 days, 0:47:13
epoch [10/50] batch [360/2000] time 4.290 (4.268) data 0.000 (0.003) loss 1.0210 (1.2939) lr 1.9686e-03 eta 4 days, 0:47:22
epoch [10/50] batch [380/2000] time 4.274 (4.269) data 0.000 (0.002) loss 0.4204 (1.3017) lr 1.9686e-03 eta 4 days, 0:47:49
epoch [10/50] batch [400/2000] time 4.288 (4.270) data 0.000 (0.002) loss 1.5228 (1.2890) lr 1.9686e-03 eta 4 days, 0:47:38
epoch [10/50] batch [420/2000] time 4.231 (4.265) data 0.000 (0.002) loss 0.2527 (1.2953) lr 1.9686e-03 eta 4 days, 0:38:45
epoch [10/50] batch [440/2000] time 4.258 (4.266) data 0.000 (0.002) loss 0.0591 (1.2857) lr 1.9686e-03 eta 4 days, 0:38:27
epoch [10/50] batch [460/2000] time 4.315 (4.267) data 0.000 (0.002) loss 0.3528 (1.2997) lr 1.9686e-03 eta 4 days, 0:38:32
epoch [10/50] batch [480/2000] time 4.288 (4.268) data 0.000 (0.002) loss 2.6267 (1.2971) lr 1.9686e-03 eta 4 days, 0:39:04
epoch [10/50] batch [500/2000] time 4.250 (4.269) data 0.000 (0.002) loss 1.6006 (1.2879) lr 1.9686e-03 eta 4 days, 0:38:57
epoch [10/50] batch [520/2000] time 4.298 (4.270) data 0.000 (0.002) loss 1.0928 (1.2855) lr 1.9686e-03 eta 4 days, 0:38:31
epoch [10/50] batch [540/2000] time 4.237 (4.271) data 0.000 (0.002) loss 0.6870 (1.2754) lr 1.9686e-03 eta 4 days, 0:38:01
epoch [10/50] batch [560/2000] time 4.392 (4.269) data 0.000 (0.002) loss 0.4422 (1.2768) lr 1.9686e-03 eta 4 days, 0:34:09
epoch [10/50] batch [580/2000] time 4.320 (4.269) data 0.000 (0.002) loss 2.6148 (1.2822) lr 1.9686e-03 eta 4 days, 0:33:28
epoch [10/50] batch [600/2000] time 4.311 (4.270) data 0.001 (0.002) loss 0.9104 (1.2858) lr 1.9686e-03 eta 4 days, 0:33:10
epoch [10/50] batch [620/2000] time 4.339 (4.271) data 0.000 (0.002) loss 1.1671 (1.2795) lr 1.9686e-03 eta 4 days, 0:32:41
epoch [10/50] batch [640/2000] time 4.323 (4.272) data 0.000 (0.002) loss 0.0760 (1.2685) lr 1.9686e-03 eta 4 days, 0:33:06
epoch [10/50] batch [660/2000] time 4.286 (4.273) data 0.000 (0.002) loss 2.1142 (1.2726) lr 1.9686e-03 eta 4 days, 0:33:01
epoch [10/50] batch [680/2000] time 4.307 (4.274) data 0.000 (0.002) loss 0.3275 (1.2724) lr 1.9686e-03 eta 4 days, 0:32:45
epoch [10/50] batch [700/2000] time 4.289 (4.275) data 0.000 (0.002) loss 0.0871 (1.2677) lr 1.9686e-03 eta 4 days, 0:32:29
epoch [10/50] batch [720/2000] time 4.329 (4.274) data 0.000 (0.002) loss 0.4196 (1.2654) lr 1.9686e-03 eta 4 days, 0:29:28
epoch [10/50] batch [740/2000] time 4.326 (4.275) data 0.003 (0.001) loss 3.2448 (1.2691) lr 1.9686e-03 eta 4 days, 0:29:28
epoch [10/50] batch [760/2000] time 4.278 (4.276) data 0.000 (0.001) loss 0.2929 (1.2684) lr 1.9686e-03 eta 4 days, 0:29:19
epoch [10/50] batch [780/2000] time 4.255 (4.276) data 0.000 (0.001) loss 2.6282 (1.2745) lr 1.9686e-03 eta 4 days, 0:28:28
epoch [10/50] batch [800/2000] time 4.257 (4.277) data 0.000 (0.001) loss 0.5550 (1.2659) lr 1.9686e-03 eta 4 days, 0:27:36
epoch [10/50] batch [820/2000] time 4.250 (4.277) data 0.000 (0.001) loss 0.5637 (1.2635) lr 1.9686e-03 eta 4 days, 0:26:37
epoch [10/50] batch [840/2000] time 4.323 (4.277) data 0.000 (0.001) loss 0.4801 (1.2651) lr 1.9686e-03 eta 4 days, 0:25:41
epoch [10/50] batch [860/2000] time 4.404 (4.277) data 0.000 (0.001) loss 0.4308 (1.2681) lr 1.9686e-03 eta 4 days, 0:23:58
epoch [10/50] batch [880/2000] time 2.075 (4.259) data 0.000 (0.001) loss 0.9602 (1.2685) lr 1.9686e-03 eta 3 days, 23:58:08
epoch [10/50] batch [900/2000] time 4.343 (4.229) data 0.000 (0.001) loss 0.4903 (1.2654) lr 1.9686e-03 eta 3 days, 23:16:00
epoch [10/50] batch [920/2000] time 3.167 (4.198) data 0.000 (0.001) loss 0.3209 (1.2670) lr 1.9686e-03 eta 3 days, 22:32:49
epoch [10/50] batch [940/2000] time 2.648 (4.169) data 0.000 (0.001) loss 1.5735 (1.2652) lr 1.9686e-03 eta 3 days, 21:52:31
epoch [10/50] batch [960/2000] time 2.051 (4.133) data 0.000 (0.001) loss 2.0154 (1.2682) lr 1.9686e-03 eta 3 days, 21:02:22
epoch [10/50] batch [980/2000] time 3.680 (4.108) data 0.000 (0.001) loss 3.5118 (1.2741) lr 1.9686e-03 eta 3 days, 20:27:30
epoch [10/50] batch [1000/2000] time 2.198 (4.090) data 0.000 (0.001) loss 0.3889 (1.2731) lr 1.9686e-03 eta 3 days, 20:01:38
epoch [10/50] batch [1020/2000] time 3.721 (4.076) data 0.000 (0.001) loss 0.4051 (1.2744) lr 1.9686e-03 eta 3 days, 19:41:27
epoch [10/50] batch [1040/2000] time 2.084 (4.042) data 0.000 (0.001) loss 1.6063 (1.2714) lr 1.9686e-03 eta 3 days, 18:54:13
epoch [10/50] batch [1060/2000] time 2.508 (4.017) data 0.000 (0.001) loss 0.2563 (1.2676) lr 1.9686e-03 eta 3 days, 18:18:34
epoch [10/50] batch [1080/2000] time 2.139 (3.983) data 0.000 (0.001) loss 1.6343 (1.2639) lr 1.9686e-03 eta 3 days, 17:31:38
epoch [10/50] batch [1100/2000] time 3.681 (3.969) data 0.001 (0.001) loss 1.4011 (1.2625) lr 1.9686e-03 eta 3 days, 17:11:28
epoch [10/50] batch [1120/2000] time 3.065 (3.956) data 0.000 (0.001) loss 0.1456 (1.2635) lr 1.9686e-03 eta 3 days, 16:52:32
epoch [10/50] batch [1140/2000] time 2.026 (3.937) data 0.001 (0.001) loss 1.6755 (1.2646) lr 1.9686e-03 eta 3 days, 16:25:30
epoch [10/50] batch [1160/2000] time 2.607 (3.919) data 0.000 (0.001) loss 3.1327 (1.2677) lr 1.9686e-03 eta 3 days, 16:00:44
epoch [10/50] batch [1180/2000] time 2.157 (3.907) data 0.000 (0.001) loss 1.2853 (1.2662) lr 1.9686e-03 eta 3 days, 15:42:12
epoch [10/50] batch [1200/2000] time 3.662 (3.896) data 0.000 (0.001) loss 0.6310 (1.2670) lr 1.9686e-03 eta 3 days, 15:27:00
epoch [10/50] batch [1220/2000] time 2.008 (3.875) data 0.000 (0.001) loss 0.1129 (1.2619) lr 1.9686e-03 eta 3 days, 14:56:45
epoch [10/50] batch [1240/2000] time 4.116 (3.856) data 0.000 (0.001) loss 1.6301 (1.2578) lr 1.9686e-03 eta 3 days, 14:30:27
epoch [10/50] batch [1260/2000] time 4.098 (3.860) data 0.000 (0.001) loss 2.2427 (1.2589) lr 1.9686e-03 eta 3 days, 14:34:22
epoch [10/50] batch [1280/2000] time 4.164 (3.861) data 0.000 (0.001) loss 1.0354 (1.2593) lr 1.9686e-03 eta 3 days, 14:34:06
epoch [10/50] batch [1300/2000] time 4.145 (3.861) data 0.000 (0.001) loss 2.3726 (1.2615) lr 1.9686e-03 eta 3 days, 14:33:03
epoch [10/50] batch [1320/2000] time 4.110 (3.865) data 0.000 (0.001) loss 1.3465 (1.2632) lr 1.9686e-03 eta 3 days, 14:37:07
epoch [10/50] batch [1340/2000] time 4.144 (3.865) data 0.000 (0.001) loss 1.7919 (1.2614) lr 1.9686e-03 eta 3 days, 14:36:02
epoch [10/50] batch [1360/2000] time 4.160 (3.866) data 0.000 (0.001) loss 1.0722 (1.2596) lr 1.9686e-03 eta 3 days, 14:35:16
epoch [10/50] batch [1380/2000] time 2.523 (3.868) data 0.000 (0.001) loss 1.8848 (1.2612) lr 1.9686e-03 eta 3 days, 14:37:14
epoch [10/50] batch [1400/2000] time 4.115 (3.869) data 0.000 (0.001) loss 0.6678 (1.2620) lr 1.9686e-03 eta 3 days, 14:37:53
epoch [10/50] batch [1420/2000] time 4.112 (3.870) data 0.000 (0.001) loss 1.5794 (1.2579) lr 1.9686e-03 eta 3 days, 14:36:53
epoch [10/50] batch [1440/2000] time 2.615 (3.871) data 0.000 (0.001) loss 1.5833 (1.2615) lr 1.9686e-03 eta 3 days, 14:37:02
epoch [10/50] batch [1460/2000] time 4.025 (3.873) data 0.000 (0.001) loss 2.1884 (1.2667) lr 1.9686e-03 eta 3 days, 14:38:29
epoch [10/50] batch [1480/2000] time 4.144 (3.873) data 0.000 (0.001) loss 0.5726 (1.2608) lr 1.9686e-03 eta 3 days, 14:38:13
epoch [10/50] batch [1500/2000] time 4.097 (3.874) data 0.000 (0.001) loss 1.6022 (1.2598) lr 1.9686e-03 eta 3 days, 14:38:13
epoch [10/50] batch [1520/2000] time 4.138 (3.878) data 0.000 (0.001) loss 1.1229 (1.2612) lr 1.9686e-03 eta 3 days, 14:41:19
epoch [10/50] batch [1540/2000] time 2.289 (3.866) data 0.000 (0.001) loss 2.3333 (1.2618) lr 1.9686e-03 eta 3 days, 14:24:28
epoch [10/50] batch [1560/2000] time 2.166 (3.848) data 0.000 (0.001) loss 0.3565 (1.2606) lr 1.9686e-03 eta 3 days, 13:58:39
epoch [10/50] batch [1580/2000] time 3.495 (3.837) data 0.000 (0.001) loss 2.9907 (1.2565) lr 1.9686e-03 eta 3 days, 13:42:30
epoch [10/50] batch [1600/2000] time 2.182 (3.833) data 0.000 (0.001) loss 1.0447 (1.2510) lr 1.9686e-03 eta 3 days, 13:36:47
epoch [10/50] batch [1620/2000] time 2.974 (3.831) data 0.000 (0.001) loss 2.8399 (1.2499) lr 1.9686e-03 eta 3 days, 13:32:51
epoch [10/50] batch [1640/2000] time 3.250 (3.830) data 0.000 (0.001) loss 2.2414 (1.2494) lr 1.9686e-03 eta 3 days, 13:29:00
epoch [10/50] batch [1660/2000] time 3.636 (3.828) data 0.000 (0.001) loss 0.6479 (1.2507) lr 1.9686e-03 eta 3 days, 13:25:13
epoch [10/50] batch [1680/2000] time 3.443 (3.825) data 0.001 (0.001) loss 0.4410 (1.2508) lr 1.9686e-03 eta 3 days, 13:20:52
epoch [10/50] batch [1700/2000] time 3.475 (3.823) data 0.000 (0.001) loss 0.8453 (1.2509) lr 1.9686e-03 eta 3 days, 13:16:46
epoch [10/50] batch [1720/2000] time 2.320 (3.820) data 0.000 (0.001) loss 1.3352 (1.2514) lr 1.9686e-03 eta 3 days, 13:11:29
epoch [10/50] batch [1740/2000] time 2.622 (3.818) data 0.000 (0.001) loss 1.1906 (1.2551) lr 1.9686e-03 eta 3 days, 13:07:38
epoch [10/50] batch [1760/2000] time 2.741 (3.816) data 0.000 (0.001) loss 1.8618 (1.2578) lr 1.9686e-03 eta 3 days, 13:03:40
epoch [10/50] batch [1780/2000] time 2.069 (3.807) data 0.000 (0.001) loss 0.3098 (1.2568) lr 1.9686e-03 eta 3 days, 12:49:38
epoch [10/50] batch [1800/2000] time 3.712 (3.794) data 0.000 (0.001) loss 0.2627 (1.2547) lr 1.9686e-03 eta 3 days, 12:31:32
epoch [10/50] batch [1820/2000] time 2.664 (3.788) data 0.000 (0.001) loss 1.9555 (1.2523) lr 1.9686e-03 eta 3 days, 12:22:23
epoch [10/50] batch [1840/2000] time 3.011 (3.784) data 0.000 (0.001) loss 0.4009 (1.2536) lr 1.9686e-03 eta 3 days, 12:14:53
epoch [10/50] batch [1860/2000] time 2.092 (3.769) data 0.000 (0.001) loss 0.5778 (1.2510) lr 1.9686e-03 eta 3 days, 11:54:20
epoch [10/50] batch [1880/2000] time 2.076 (3.755) data 0.000 (0.001) loss 1.0393 (1.2517) lr 1.9686e-03 eta 3 days, 11:33:33
epoch [10/50] batch [1900/2000] time 3.625 (3.739) data 0.000 (0.001) loss 1.6170 (1.2543) lr 1.9686e-03 eta 3 days, 11:12:01
epoch [10/50] batch [1920/2000] time 3.684 (3.734) data 0.000 (0.001) loss 0.8368 (1.2553) lr 1.9686e-03 eta 3 days, 11:03:09
epoch [10/50] batch [1940/2000] time 3.759 (3.728) data 0.000 (0.001) loss 3.1829 (1.2576) lr 1.9686e-03 eta 3 days, 10:54:40
epoch [10/50] batch [1960/2000] time 2.062 (3.721) data 0.000 (0.001) loss 0.2061 (1.2570) lr 1.9686e-03 eta 3 days, 10:43:12
epoch [10/50] batch [1980/2000] time 2.330 (3.705) data 0.000 (0.001) loss 1.4967 (1.2593) lr 1.9686e-03 eta 3 days, 10:21:16
epoch [10/50] batch [2000/2000] time 4.267 (3.711) data 0.000 (0.001) loss 2.4267 (1.2582) lr 1.9511e-03 eta 3 days, 10:27:38
epoch [11/50] batch [20/2000] time 4.309 (4.341) data 0.000 (0.029) loss 0.6935 (1.1889) lr 1.9511e-03 eta 4 days, 0:26:16
epoch [11/50] batch [40/2000] time 4.314 (4.323) data 0.000 (0.015) loss 0.2153 (1.0933) lr 1.9511e-03 eta 4 days, 0:01:13
epoch [11/50] batch [60/2000] time 4.234 (4.310) data 0.001 (0.010) loss 1.7520 (0.9634) lr 1.9511e-03 eta 3 days, 23:42:56
epoch [11/50] batch [80/2000] time 4.229 (4.305) data 0.000 (0.008) loss 1.6514 (0.9763) lr 1.9511e-03 eta 3 days, 23:34:48
epoch [11/50] batch [100/2000] time 4.215 (4.301) data 0.000 (0.006) loss 0.4024 (1.0635) lr 1.9511e-03 eta 3 days, 23:27:07
epoch [11/50] batch [120/2000] time 4.379 (4.287) data 0.000 (0.005) loss 3.1657 (1.1959) lr 1.9511e-03 eta 3 days, 23:07:43
epoch [11/50] batch [140/2000] time 4.330 (4.281) data 0.000 (0.004) loss 0.1636 (1.2094) lr 1.9511e-03 eta 3 days, 22:57:59
epoch [11/50] batch [160/2000] time 4.245 (4.283) data 0.000 (0.004) loss 0.3528 (1.1991) lr 1.9511e-03 eta 3 days, 22:59:03
epoch [11/50] batch [180/2000] time 4.277 (4.283) data 0.003 (0.004) loss 0.9060 (1.1980) lr 1.9511e-03 eta 3 days, 22:58:15
epoch [11/50] batch [200/2000] time 4.254 (4.284) data 0.000 (0.003) loss 1.1749 (1.1928) lr 1.9511e-03 eta 3 days, 22:57:20
epoch [11/50] batch [220/2000] time 4.260 (4.285) data 0.000 (0.003) loss 1.3958 (1.1914) lr 1.9511e-03 eta 3 days, 22:57:21
epoch [11/50] batch [240/2000] time 4.255 (4.286) data 0.000 (0.003) loss 1.4950 (1.2053) lr 1.9511e-03 eta 3 days, 22:57:34
epoch [11/50] batch [260/2000] time 4.284 (4.287) data 0.000 (0.003) loss 1.9034 (1.2141) lr 1.9511e-03 eta 3 days, 22:56:50
epoch [11/50] batch [280/2000] time 4.309 (4.277) data 0.000 (0.002) loss 0.3007 (1.1917) lr 1.9511e-03 eta 3 days, 22:42:21
epoch [11/50] batch [300/2000] time 4.301 (4.278) data 0.000 (0.002) loss 0.5132 (1.2043) lr 1.9511e-03 eta 3 days, 22:42:12
epoch [11/50] batch [320/2000] time 4.320 (4.280) data 0.000 (0.002) loss 1.4117 (1.1965) lr 1.9511e-03 eta 3 days, 22:43:18
epoch [11/50] batch [340/2000] time 4.288 (4.281) data 0.000 (0.002) loss 1.7166 (1.1977) lr 1.9511e-03 eta 3 days, 22:43:35
epoch [11/50] batch [360/2000] time 4.269 (4.281) data 0.000 (0.002) loss 0.6872 (1.2152) lr 1.9511e-03 eta 3 days, 22:42:54
epoch [11/50] batch [380/2000] time 4.241 (4.283) data 0.000 (0.002) loss 0.9437 (1.2265) lr 1.9511e-03 eta 3 days, 22:43:04
epoch [11/50] batch [400/2000] time 4.337 (4.284) data 0.000 (0.002) loss 2.3115 (1.2237) lr 1.9511e-03 eta 3 days, 22:43:25
epoch [11/50] batch [420/2000] time 4.424 (4.283) data 0.000 (0.002) loss 0.8207 (1.2215) lr 1.9511e-03 eta 3 days, 22:40:57
epoch [11/50] batch [440/2000] time 4.344 (4.279) data 0.000 (0.002) loss 1.4147 (1.2229) lr 1.9511e-03 eta 3 days, 22:34:30
epoch [11/50] batch [460/2000] time 4.268 (4.280) data 0.000 (0.002) loss 1.1184 (1.2364) lr 1.9511e-03 eta 3 days, 22:33:45
epoch [11/50] batch [480/2000] time 4.277 (4.281) data 0.000 (0.002) loss 1.0328 (1.2388) lr 1.9511e-03 eta 3 days, 22:33:22
epoch [11/50] batch [500/2000] time 4.300 (4.281) data 0.000 (0.002) loss 1.2193 (1.2400) lr 1.9511e-03 eta 3 days, 22:32:21
epoch [11/50] batch [520/2000] time 4.332 (4.282) data 0.000 (0.002) loss 1.5661 (1.2327) lr 1.9511e-03 eta 3 days, 22:32:21
epoch [11/50] batch [540/2000] time 4.307 (4.283) data 0.000 (0.002) loss 1.3211 (1.2257) lr 1.9511e-03 eta 3 days, 22:31:43
epoch [11/50] batch [560/2000] time 4.341 (4.280) data 0.000 (0.002) loss 2.3547 (1.2333) lr 1.9511e-03 eta 3 days, 22:26:34
epoch [11/50] batch [580/2000] time 4.311 (4.279) data 0.000 (0.001) loss 0.0861 (1.2286) lr 1.9511e-03 eta 3 days, 22:23:30
epoch [11/50] batch [600/2000] time 4.319 (4.279) data 0.001 (0.001) loss 0.5669 (1.2263) lr 1.9511e-03 eta 3 days, 22:22:34
epoch [11/50] batch [620/2000] time 4.321 (4.280) data 0.000 (0.001) loss 0.2808 (1.2237) lr 1.9511e-03 eta 3 days, 22:22:18
epoch [11/50] batch [640/2000] time 4.311 (4.281) data 0.000 (0.001) loss 1.6060 (1.2268) lr 1.9511e-03 eta 3 days, 22:22:02
epoch [11/50] batch [660/2000] time 4.344 (4.281) data 0.000 (0.001) loss 2.4250 (1.2249) lr 1.9511e-03 eta 3 days, 22:21:02
epoch [11/50] batch [680/2000] time 4.278 (4.282) data 0.000 (0.001) loss 0.2748 (1.2116) lr 1.9511e-03 eta 3 days, 22:20:38
epoch [11/50] batch [700/2000] time 4.264 (4.282) data 0.000 (0.001) loss 2.2877 (1.2111) lr 1.9511e-03 eta 3 days, 22:19:51
epoch [11/50] batch [720/2000] time 4.266 (4.281) data 0.000 (0.001) loss 0.8054 (1.2029) lr 1.9511e-03 eta 3 days, 22:16:16
epoch [11/50] batch [740/2000] time 4.306 (4.281) data 0.000 (0.001) loss 1.3826 (1.2018) lr 1.9511e-03 eta 3 days, 22:15:42
epoch [11/50] batch [760/2000] time 4.217 (4.282) data 0.000 (0.001) loss 1.7056 (1.2082) lr 1.9511e-03 eta 3 days, 22:14:54
epoch [11/50] batch [780/2000] time 4.325 (4.282) data 0.000 (0.001) loss 2.7321 (1.2116) lr 1.9511e-03 eta 3 days, 22:13:15
epoch [11/50] batch [800/2000] time 4.307 (4.282) data 0.000 (0.001) loss 1.8966 (1.2123) lr 1.9511e-03 eta 3 days, 22:12:15
epoch [11/50] batch [820/2000] time 4.301 (4.282) data 0.000 (0.001) loss 0.6798 (1.2115) lr 1.9511e-03 eta 3 days, 22:11:04
epoch [11/50] batch [840/2000] time 4.288 (4.282) data 0.000 (0.001) loss 1.0068 (1.2087) lr 1.9511e-03 eta 3 days, 22:09:46
epoch [11/50] batch [860/2000] time 4.405 (4.281) data 0.000 (0.001) loss 2.1302 (1.2090) lr 1.9511e-03 eta 3 days, 22:06:38
epoch [11/50] batch [880/2000] time 4.329 (4.280) data 0.000 (0.001) loss 2.2384 (1.2069) lr 1.9511e-03 eta 3 days, 22:03:37
epoch [11/50] batch [900/2000] time 4.342 (4.280) data 0.004 (0.001) loss 0.3560 (1.2109) lr 1.9511e-03 eta 3 days, 22:02:40
epoch [11/50] batch [920/2000] time 4.286 (4.281) data 0.000 (0.001) loss 0.4964 (1.2192) lr 1.9511e-03 eta 3 days, 22:02:03
epoch [11/50] batch [940/2000] time 4.250 (4.281) data 0.000 (0.001) loss 1.9002 (1.2168) lr 1.9511e-03 eta 3 days, 22:00:58
epoch [11/50] batch [960/2000] time 4.321 (4.281) data 0.000 (0.001) loss 0.1900 (1.2157) lr 1.9511e-03 eta 3 days, 22:00:02
epoch [11/50] batch [980/2000] time 4.332 (4.282) data 0.000 (0.001) loss 1.3216 (1.2172) lr 1.9511e-03 eta 3 days, 21:58:54
epoch [11/50] batch [1000/2000] time 4.257 (4.282) data 0.000 (0.001) loss 1.3190 (1.2231) lr 1.9511e-03 eta 3 days, 21:57:45
epoch [11/50] batch [1020/2000] time 4.212 (4.279) data 0.000 (0.001) loss 0.0681 (1.2224) lr 1.9511e-03 eta 3 days, 21:52:42
epoch [11/50] batch [1040/2000] time 4.331 (4.279) data 0.000 (0.001) loss 1.6130 (1.2276) lr 1.9511e-03 eta 3 days, 21:51:37
epoch [11/50] batch [1060/2000] time 4.317 (4.280) data 0.000 (0.001) loss 0.0775 (1.2287) lr 1.9511e-03 eta 3 days, 21:50:33
epoch [11/50] batch [1080/2000] time 4.330 (4.280) data 0.000 (0.001) loss 1.0568 (1.2286) lr 1.9511e-03 eta 3 days, 21:49:19
epoch [11/50] batch [1100/2000] time 4.284 (4.280) data 0.000 (0.001) loss 4.3137 (1.2251) lr 1.9511e-03 eta 3 days, 21:48:22
epoch [11/50] batch [1120/2000] time 4.296 (4.280) data 0.000 (0.001) loss 1.4558 (1.2266) lr 1.9511e-03 eta 3 days, 21:46:58
epoch [11/50] batch [1140/2000] time 4.209 (4.280) data 0.001 (0.001) loss 0.2166 (1.2254) lr 1.9511e-03 eta 3 days, 21:45:44
epoch [11/50] batch [1160/2000] time 4.355 (4.279) data 0.000 (0.001) loss 1.2286 (1.2271) lr 1.9511e-03 eta 3 days, 21:42:50
epoch [11/50] batch [1180/2000] time 4.278 (4.278) data 0.000 (0.001) loss 1.1849 (1.2260) lr 1.9511e-03 eta 3 days, 21:39:13
epoch [11/50] batch [1200/2000] time 4.222 (4.278) data 0.000 (0.001) loss 0.1912 (1.2281) lr 1.9511e-03 eta 3 days, 21:37:54
epoch [11/50] batch [1220/2000] time 4.285 (4.278) data 0.000 (0.001) loss 1.8065 (1.2245) lr 1.9511e-03 eta 3 days, 21:36:39
epoch [11/50] batch [1240/2000] time 4.280 (4.278) data 0.000 (0.001) loss 2.5311 (1.2257) lr 1.9511e-03 eta 3 days, 21:35:33
epoch [11/50] batch [1260/2000] time 4.315 (4.278) data 0.000 (0.001) loss 1.9904 (1.2255) lr 1.9511e-03 eta 3 days, 21:34:31
epoch [11/50] batch [1280/2000] time 4.306 (4.278) data 0.000 (0.001) loss 1.4252 (1.2262) lr 1.9511e-03 eta 3 days, 21:33:06
epoch [11/50] batch [1300/2000] time 4.282 (4.278) data 0.009 (0.001) loss 1.1333 (1.2279) lr 1.9511e-03 eta 3 days, 21:31:39
epoch [11/50] batch [1320/2000] time 4.297 (4.276) data 0.000 (0.001) loss 0.6778 (1.2239) lr 1.9511e-03 eta 3 days, 21:27:21
epoch [11/50] batch [1340/2000] time 4.341 (4.276) data 0.000 (0.001) loss 0.8940 (1.2199) lr 1.9511e-03 eta 3 days, 21:26:11
epoch [11/50] batch [1360/2000] time 4.247 (4.276) data 0.000 (0.001) loss 1.3832 (1.2191) lr 1.9511e-03 eta 3 days, 21:24:51
epoch [11/50] batch [1380/2000] time 4.278 (4.276) data 0.000 (0.001) loss 0.5105 (1.2185) lr 1.9511e-03 eta 3 days, 21:23:35
epoch [11/50] batch [1400/2000] time 4.274 (4.277) data 0.000 (0.001) loss 1.2249 (1.2185) lr 1.9511e-03 eta 3 days, 21:22:13
epoch [11/50] batch [1420/2000] time 4.291 (4.277) data 0.000 (0.001) loss 1.0616 (1.2177) lr 1.9511e-03 eta 3 days, 21:20:58
epoch [11/50] batch [1440/2000] time 4.295 (4.277) data 0.000 (0.001) loss 0.1835 (1.2166) lr 1.9511e-03 eta 3 days, 21:19:49
epoch [11/50] batch [1460/2000] time 4.364 (4.276) data 0.000 (0.001) loss 0.9371 (1.2185) lr 1.9511e-03 eta 3 days, 21:17:48
epoch [11/50] batch [1480/2000] time 4.270 (4.275) data 0.000 (0.001) loss 0.3078 (1.2149) lr 1.9511e-03 eta 3 days, 21:15:08
epoch [11/50] batch [1500/2000] time 4.304 (4.276) data 0.001 (0.001) loss 0.8037 (1.2114) lr 1.9511e-03 eta 3 days, 21:14:06
epoch [11/50] batch [1520/2000] time 4.288 (4.276) data 0.000 (0.001) loss 0.9129 (1.2132) lr 1.9511e-03 eta 3 days, 21:13:10
epoch [11/50] batch [1540/2000] time 4.327 (4.276) data 0.000 (0.001) loss 1.4959 (1.2124) lr 1.9511e-03 eta 3 days, 21:12:10
epoch [11/50] batch [1560/2000] time 4.237 (4.277) data 0.000 (0.001) loss 1.4502 (1.2105) lr 1.9511e-03 eta 3 days, 21:11:09
epoch [11/50] batch [1580/2000] time 4.349 (4.277) data 0.001 (0.001) loss 0.6383 (1.2079) lr 1.9511e-03 eta 3 days, 21:10:13
epoch [11/50] batch [1600/2000] time 4.436 (4.276) data 0.000 (0.001) loss 0.9938 (1.2071) lr 1.9511e-03 eta 3 days, 21:07:34
epoch [11/50] batch [1620/2000] time 4.324 (4.276) data 0.000 (0.001) loss 1.6495 (1.2029) lr 1.9511e-03 eta 3 days, 21:05:44
epoch [11/50] batch [1640/2000] time 4.253 (4.276) data 0.000 (0.001) loss 0.3467 (1.2032) lr 1.9511e-03 eta 3 days, 21:04:45
epoch [11/50] batch [1660/2000] time 4.286 (4.276) data 0.000 (0.001) loss 0.6979 (1.2033) lr 1.9511e-03 eta 3 days, 21:03:32
epoch [11/50] batch [1680/2000] time 4.279 (4.276) data 0.001 (0.001) loss 1.2475 (1.2007) lr 1.9511e-03 eta 3 days, 21:02:05
epoch [11/50] batch [1700/2000] time 4.300 (4.277) data 0.000 (0.001) loss 0.4138 (1.2016) lr 1.9511e-03 eta 3 days, 21:01:01
epoch [11/50] batch [1720/2000] time 4.284 (4.277) data 0.000 (0.001) loss 2.8787 (1.1981) lr 1.9511e-03 eta 3 days, 21:00:01
epoch [11/50] batch [1740/2000] time 4.288 (4.277) data 0.000 (0.001) loss 1.6020 (1.2008) lr 1.9511e-03 eta 3 days, 20:59:04
epoch [11/50] batch [1760/2000] time 4.341 (4.277) data 0.000 (0.001) loss 0.0954 (1.1997) lr 1.9511e-03 eta 3 days, 20:56:36
epoch [11/50] batch [1780/2000] time 4.339 (4.277) data 0.000 (0.001) loss 2.8039 (1.2000) lr 1.9511e-03 eta 3 days, 20:55:35
epoch [11/50] batch [1800/2000] time 4.264 (4.277) data 0.000 (0.001) loss 0.4935 (1.1982) lr 1.9511e-03 eta 3 days, 20:54:29
epoch [11/50] batch [1820/2000] time 4.319 (4.277) data 0.000 (0.001) loss 2.5283 (1.1996) lr 1.9511e-03 eta 3 days, 20:53:09
epoch [11/50] batch [1840/2000] time 4.312 (4.277) data 0.000 (0.001) loss 0.5367 (1.1971) lr 1.9511e-03 eta 3 days, 20:51:59
epoch [11/50] batch [1860/2000] time 4.316 (4.278) data 0.000 (0.001) loss 0.3268 (1.1952) lr 1.9511e-03 eta 3 days, 20:50:54
epoch [11/50] batch [1880/2000] time 4.335 (4.278) data 0.000 (0.001) loss 3.9122 (1.1999) lr 1.9511e-03 eta 3 days, 20:49:45
epoch [11/50] batch [1900/2000] time 4.321 (4.277) data 0.001 (0.001) loss 0.3633 (1.2062) lr 1.9511e-03 eta 3 days, 20:47:38
epoch [11/50] batch [1920/2000] time 4.318 (4.277) data 0.000 (0.001) loss 1.6159 (1.2047) lr 1.9511e-03 eta 3 days, 20:46:16
epoch [11/50] batch [1940/2000] time 4.317 (4.278) data 0.001 (0.001) loss 0.5680 (1.2023) lr 1.9511e-03 eta 3 days, 20:45:10
epoch [11/50] batch [1960/2000] time 4.250 (4.278) data 0.000 (0.001) loss 1.5600 (1.1999) lr 1.9511e-03 eta 3 days, 20:43:48
epoch [11/50] batch [1980/2000] time 4.281 (4.278) data 0.000 (0.001) loss 1.7178 (1.1992) lr 1.9511e-03 eta 3 days, 20:42:30
epoch [11/50] batch [2000/2000] time 4.246 (4.278) data 0.000 (0.001) loss 2.0979 (1.2018) lr 1.9298e-03 eta 3 days, 20:41:18
epoch [12/50] batch [20/2000] time 4.327 (4.330) data 0.000 (0.036) loss 0.3709 (1.4517) lr 1.9298e-03 eta 3 days, 21:47:23
epoch [12/50] batch [40/2000] time 3.240 (4.271) data 0.000 (0.018) loss 2.0922 (1.2938) lr 1.9298e-03 eta 3 days, 20:29:42
epoch [12/50] batch [60/2000] time 4.449 (4.276) data 0.008 (0.012) loss 1.8126 (1.2120) lr 1.9298e-03 eta 3 days, 20:34:31
epoch [12/50] batch [80/2000] time 3.788 (3.873) data 0.000 (0.010) loss 1.1163 (1.1340) lr 1.9298e-03 eta 3 days, 11:49:52
epoch [12/50] batch [100/2000] time 2.952 (3.676) data 0.002 (0.008) loss 0.1357 (1.1352) lr 1.9298e-03 eta 3 days, 7:32:53
epoch [12/50] batch [120/2000] time 3.356 (3.484) data 0.000 (0.007) loss 1.1999 (1.2123) lr 1.9298e-03 eta 3 days, 3:22:31
epoch [12/50] batch [140/2000] time 2.021 (3.356) data 0.000 (0.006) loss 0.4392 (1.2879) lr 1.9298e-03 eta 3 days, 0:34:30
epoch [12/50] batch [160/2000] time 2.505 (3.240) data 0.000 (0.005) loss 0.9148 (1.2391) lr 1.9298e-03 eta 2 days, 22:03:15
epoch [12/50] batch [180/2000] time 3.741 (3.253) data 0.000 (0.005) loss 1.5101 (1.2490) lr 1.9298e-03 eta 2 days, 22:18:45
epoch [12/50] batch [200/2000] time 3.196 (3.257) data 0.000 (0.004) loss 6.8163 (1.2830) lr 1.9298e-03 eta 2 days, 22:23:20
epoch [12/50] batch [220/2000] time 3.102 (3.207) data 0.000 (0.004) loss 1.7314 (1.3008) lr 1.9298e-03 eta 2 days, 21:17:23
epoch [12/50] batch [240/2000] time 2.571 (3.146) data 0.000 (0.004) loss 1.0773 (1.3205) lr 1.9298e-03 eta 2 days, 19:56:37
epoch [12/50] batch [260/2000] time 3.032 (3.091) data 0.000 (0.003) loss 0.0276 (1.3091) lr 1.9298e-03 eta 2 days, 18:44:49
epoch [12/50] batch [280/2000] time 2.875 (3.062) data 0.000 (0.003) loss 1.0092 (1.2838) lr 1.9298e-03 eta 2 days, 18:06:47
epoch [12/50] batch [300/2000] time 3.687 (3.084) data 0.000 (0.003) loss 0.4384 (1.2634) lr 1.9298e-03 eta 2 days, 18:33:26
epoch [12/50] batch [320/2000] time 2.060 (3.064) data 0.000 (0.003) loss 2.1438 (1.2648) lr 1.9298e-03 eta 2 days, 18:06:38
epoch [12/50] batch [340/2000] time 2.056 (3.031) data 0.000 (0.003) loss 0.8860 (1.2608) lr 1.9298e-03 eta 2 days, 17:22:29
epoch [12/50] batch [360/2000] time 2.834 (3.025) data 0.000 (0.003) loss 0.2809 (1.2482) lr 1.9298e-03 eta 2 days, 17:14:01
epoch [12/50] batch [380/2000] time 2.857 (3.035) data 0.000 (0.002) loss 0.1747 (1.2655) lr 1.9298e-03 eta 2 days, 17:26:32
epoch [12/50] batch [400/2000] time 3.699 (3.051) data 0.000 (0.002) loss 0.1289 (1.2642) lr 1.9298e-03 eta 2 days, 17:45:46
epoch [12/50] batch [420/2000] time 2.012 (3.060) data 0.001 (0.002) loss 1.0508 (1.2658) lr 1.9298e-03 eta 2 days, 17:56:51
epoch [12/50] batch [440/2000] time 2.210 (3.020) data 0.000 (0.002) loss 1.1633 (1.2571) lr 1.9298e-03 eta 2 days, 17:04:02
epoch [12/50] batch [460/2000] time 4.106 (3.060) data 0.000 (0.002) loss 0.4328 (1.2504) lr 1.9298e-03 eta 2 days, 17:54:12
epoch [12/50] batch [480/2000] time 4.129 (3.084) data 0.000 (0.002) loss 1.4380 (1.2511) lr 1.9298e-03 eta 2 days, 18:25:02
epoch [12/50] batch [500/2000] time 4.107 (3.125) data 0.000 (0.002) loss 1.2425 (1.2560) lr 1.9298e-03 eta 2 days, 19:16:27
epoch [12/50] batch [520/2000] time 4.130 (3.153) data 0.000 (0.002) loss 1.6371 (1.2612) lr 1.9298e-03 eta 2 days, 19:52:07
epoch [12/50] batch [540/2000] time 4.062 (3.178) data 0.001 (0.002) loss 0.2843 (1.2523) lr 1.9298e-03 eta 2 days, 20:22:58
epoch [12/50] batch [560/2000] time 3.920 (3.211) data 0.001 (0.002) loss 0.5733 (1.2386) lr 1.9298e-03 eta 2 days, 21:04:47
epoch [12/50] batch [580/2000] time 4.113 (3.234) data 0.000 (0.002) loss 1.7604 (1.2344) lr 1.9298e-03 eta 2 days, 21:33:10
epoch [12/50] batch [600/2000] time 4.085 (3.255) data 0.002 (0.002) loss 1.1224 (1.2276) lr 1.9298e-03 eta 2 days, 21:58:31
epoch [12/50] batch [620/2000] time 2.869 (3.280) data 0.000 (0.002) loss 0.3620 (1.2297) lr 1.9298e-03 eta 2 days, 22:30:21
epoch [12/50] batch [640/2000] time 4.032 (3.300) data 0.000 (0.002) loss 0.8387 (1.2307) lr 1.9298e-03 eta 2 days, 22:54:16
epoch [12/50] batch [660/2000] time 4.079 (3.318) data 0.000 (0.002) loss 1.5832 (1.2293) lr 1.9298e-03 eta 2 days, 23:16:28
epoch [12/50] batch [680/2000] time 2.044 (3.337) data 0.000 (0.002) loss 0.5005 (1.2328) lr 1.9298e-03 eta 2 days, 23:39:46
epoch [12/50] batch [700/2000] time 4.064 (3.356) data 0.001 (0.002) loss 1.1847 (1.2251) lr 1.9298e-03 eta 3 days, 0:03:25
epoch [12/50] batch [720/2000] time 4.118 (3.369) data 0.000 (0.002) loss 0.2108 (1.2187) lr 1.9298e-03 eta 3 days, 0:19:28
epoch [12/50] batch [740/2000] time 2.322 (3.384) data 0.000 (0.002) loss 0.9280 (1.2128) lr 1.9298e-03 eta 3 days, 0:38:04
epoch [12/50] batch [760/2000] time 4.130 (3.401) data 0.003 (0.002) loss 2.2577 (1.2126) lr 1.9298e-03 eta 3 days, 0:58:30
epoch [12/50] batch [780/2000] time 4.141 (3.414) data 0.000 (0.002) loss 2.7210 (1.2108) lr 1.9298e-03 eta 3 days, 1:13:52
epoch [12/50] batch [800/2000] time 2.230 (3.425) data 0.000 (0.002) loss 0.8773 (1.2187) lr 1.9298e-03 eta 3 days, 1:26:40
epoch [12/50] batch [820/2000] time 4.133 (3.441) data 0.000 (0.002) loss 1.6803 (1.2129) lr 1.9298e-03 eta 3 days, 1:46:31
epoch [12/50] batch [840/2000] time 4.055 (3.452) data 0.000 (0.002) loss 3.2016 (1.2218) lr 1.9298e-03 eta 3 days, 1:59:12
epoch [12/50] batch [860/2000] time 4.096 (3.462) data 0.012 (0.002) loss 1.8267 (1.2196) lr 1.9298e-03 eta 3 days, 2:10:52
epoch [12/50] batch [880/2000] time 4.178 (3.477) data 0.000 (0.002) loss 1.4984 (1.2157) lr 1.9298e-03 eta 3 days, 2:29:03
epoch [12/50] batch [900/2000] time 4.135 (3.485) data 0.002 (0.002) loss 3.9054 (1.2205) lr 1.9298e-03 eta 3 days, 2:38:49
epoch [12/50] batch [920/2000] time 4.104 (3.494) data 0.000 (0.002) loss 3.3357 (1.2271) lr 1.9298e-03 eta 3 days, 2:49:07
epoch [12/50] batch [940/2000] time 4.080 (3.507) data 0.000 (0.002) loss 2.2828 (1.2305) lr 1.9298e-03 eta 3 days, 3:04:46
epoch [12/50] batch [960/2000] time 4.091 (3.515) data 0.000 (0.002) loss 2.7501 (1.2277) lr 1.9298e-03 eta 3 days, 3:12:53
epoch [12/50] batch [980/2000] time 4.111 (3.523) data 0.000 (0.001) loss 1.1983 (1.2292) lr 1.9298e-03 eta 3 days, 3:22:04
epoch [12/50] batch [1000/2000] time 4.162 (3.535) data 0.000 (0.001) loss 1.2007 (1.2339) lr 1.9298e-03 eta 3 days, 3:36:03
epoch [12/50] batch [1020/2000] time 4.037 (3.542) data 0.014 (0.001) loss 2.2474 (1.2358) lr 1.9298e-03 eta 3 days, 3:44:25
epoch [12/50] batch [1040/2000] time 2.023 (3.540) data 0.000 (0.001) loss 0.8779 (1.2325) lr 1.9298e-03 eta 3 days, 3:40:18
epoch [12/50] batch [1060/2000] time 2.196 (3.514) data 0.001 (0.001) loss 1.5164 (1.2353) lr 1.9298e-03 eta 3 days, 3:06:35
epoch [12/50] batch [1080/2000] time 2.086 (3.491) data 0.000 (0.001) loss 1.2590 (1.2297) lr 1.9298e-03 eta 3 days, 2:35:05
epoch [12/50] batch [1100/2000] time 2.390 (3.467) data 0.000 (0.001) loss 1.8715 (1.2345) lr 1.9298e-03 eta 3 days, 2:03:37
epoch [12/50] batch [1120/2000] time 2.677 (3.446) data 0.000 (0.001) loss 2.4960 (1.2409) lr 1.9298e-03 eta 3 days, 1:35:25
epoch [12/50] batch [1140/2000] time 3.836 (3.432) data 0.001 (0.001) loss 1.3481 (1.2474) lr 1.9298e-03 eta 3 days, 1:16:08
epoch [12/50] batch [1160/2000] time 3.950 (3.435) data 0.000 (0.001) loss 0.3270 (1.2441) lr 1.9298e-03 eta 3 days, 1:19:24
epoch [12/50] batch [1180/2000] time 3.867 (3.439) data 0.000 (0.001) loss 0.7206 (1.2406) lr 1.9298e-03 eta 3 days, 1:22:51
epoch [12/50] batch [1200/2000] time 3.883 (3.443) data 0.000 (0.001) loss 3.3286 (1.2447) lr 1.9298e-03 eta 3 days, 1:27:26
epoch [12/50] batch [1220/2000] time 3.907 (3.447) data 0.000 (0.001) loss 0.0612 (1.2449) lr 1.9298e-03 eta 3 days, 1:30:56
epoch [12/50] batch [1240/2000] time 3.912 (3.451) data 0.001 (0.001) loss 1.4369 (1.2428) lr 1.9298e-03 eta 3 days, 1:34:46
epoch [12/50] batch [1260/2000] time 3.901 (3.455) data 0.000 (0.001) loss 1.8774 (1.2445) lr 1.9298e-03 eta 3 days, 1:38:18
epoch [12/50] batch [1280/2000] time 2.433 (3.449) data 0.000 (0.001) loss 1.1242 (1.2430) lr 1.9298e-03 eta 3 days, 1:30:03
epoch [12/50] batch [1300/2000] time 2.073 (3.429) data 0.000 (0.001) loss 0.9209 (1.2481) lr 1.9298e-03 eta 3 days, 1:03:25
epoch [12/50] batch [1320/2000] time 2.072 (3.410) data 0.000 (0.001) loss 0.8579 (1.2453) lr 1.9298e-03 eta 3 days, 0:38:21
epoch [12/50] batch [1340/2000] time 3.756 (3.405) data 0.000 (0.001) loss 1.4175 (1.2429) lr 1.9298e-03 eta 3 days, 0:30:59
epoch [12/50] batch [1360/2000] time 2.352 (3.403) data 0.000 (0.001) loss 0.0549 (1.2432) lr 1.9298e-03 eta 3 days, 0:26:30
epoch [12/50] batch [1380/2000] time 2.009 (3.385) data 0.000 (0.001) loss 0.9865 (1.2468) lr 1.9298e-03 eta 3 days, 0:02:07
epoch [12/50] batch [1400/2000] time 2.040 (3.365) data 0.000 (0.001) loss 0.8016 (1.2464) lr 1.9298e-03 eta 2 days, 23:36:33
epoch [12/50] batch [1420/2000] time 2.007 (3.347) data 0.000 (0.001) loss 0.4622 (1.2423) lr 1.9298e-03 eta 2 days, 23:11:38
epoch [12/50] batch [1440/2000] time 2.009 (3.329) data 0.000 (0.001) loss 1.6137 (1.2442) lr 1.9298e-03 eta 2 days, 22:47:43
epoch [12/50] batch [1460/2000] time 2.010 (3.311) data 0.005 (0.001) loss 0.4942 (1.2432) lr 1.9298e-03 eta 2 days, 22:24:13
epoch [12/50] batch [1480/2000] time 2.067 (3.294) data 0.000 (0.001) loss 0.1964 (1.2463) lr 1.9298e-03 eta 2 days, 22:01:23
epoch [12/50] batch [1500/2000] time 2.066 (3.278) data 0.000 (0.001) loss 0.8706 (1.2445) lr 1.9298e-03 eta 2 days, 21:39:02
epoch [12/50] batch [1520/2000] time 2.008 (3.261) data 0.000 (0.001) loss 0.1293 (1.2414) lr 1.9298e-03 eta 2 days, 21:17:13
epoch [12/50] batch [1540/2000] time 1.984 (3.245) data 0.000 (0.001) loss 1.0426 (1.2395) lr 1.9298e-03 eta 2 days, 20:55:48
epoch [12/50] batch [1560/2000] time 2.012 (3.230) data 0.000 (0.001) loss 0.8625 (1.2410) lr 1.9298e-03 eta 2 days, 20:35:03
epoch [12/50] batch [1580/2000] time 2.073 (3.215) data 0.000 (0.001) loss 0.2292 (1.2373) lr 1.9298e-03 eta 2 days, 20:14:54
epoch [12/50] batch [1600/2000] time 2.042 (3.200) data 0.000 (0.001) loss 0.1317 (1.2344) lr 1.9298e-03 eta 2 days, 19:55:16
epoch [12/50] batch [1620/2000] time 1.981 (3.186) data 0.000 (0.001) loss 1.4230 (1.2408) lr 1.9298e-03 eta 2 days, 19:36:05
epoch [12/50] batch [1640/2000] time 2.068 (3.173) data 0.000 (0.001) loss 0.9441 (1.2363) lr 1.9298e-03 eta 2 days, 19:17:34
epoch [12/50] batch [1660/2000] time 2.078 (3.159) data 0.000 (0.001) loss 0.9966 (1.2355) lr 1.9298e-03 eta 2 days, 18:59:18
epoch [12/50] batch [1680/2000] time 2.016 (3.146) data 0.001 (0.001) loss 0.8011 (1.2341) lr 1.9298e-03 eta 2 days, 18:41:21
epoch [12/50] batch [1700/2000] time 2.047 (3.133) data 0.000 (0.001) loss 0.2626 (1.2341) lr 1.9298e-03 eta 2 days, 18:23:48
epoch [12/50] batch [1720/2000] time 2.065 (3.120) data 0.000 (0.001) loss 0.6175 (1.2325) lr 1.9298e-03 eta 2 days, 18:06:41
epoch [12/50] batch [1740/2000] time 2.062 (3.108) data 0.000 (0.001) loss 0.6656 (1.2344) lr 1.9298e-03 eta 2 days, 17:49:54
epoch [12/50] batch [1760/2000] time 2.044 (3.096) data 0.000 (0.001) loss 0.2547 (1.2353) lr 1.9298e-03 eta 2 days, 17:33:27
epoch [12/50] batch [1780/2000] time 1.991 (3.084) data 0.000 (0.001) loss 0.3487 (1.2348) lr 1.9298e-03 eta 2 days, 17:17:20
epoch [12/50] batch [1800/2000] time 2.060 (3.072) data 0.000 (0.001) loss 4.3676 (1.2363) lr 1.9298e-03 eta 2 days, 17:01:37
epoch [12/50] batch [1820/2000] time 1.986 (3.061) data 0.000 (0.001) loss 3.4965 (1.2378) lr 1.9298e-03 eta 2 days, 16:46:12
epoch [12/50] batch [1840/2000] time 2.040 (3.050) data 0.000 (0.001) loss 1.5994 (1.2389) lr 1.9298e-03 eta 2 days, 16:31:13
epoch [12/50] batch [1860/2000] time 1.985 (3.039) data 0.000 (0.001) loss 1.6905 (1.2401) lr 1.9298e-03 eta 2 days, 16:16:24
epoch [12/50] batch [1880/2000] time 2.079 (3.028) data 0.000 (0.001) loss 0.4523 (1.2395) lr 1.9298e-03 eta 2 days, 16:02:04
epoch [12/50] batch [1900/2000] time 2.035 (3.018) data 0.000 (0.001) loss 0.7324 (1.2352) lr 1.9298e-03 eta 2 days, 15:47:53
epoch [12/50] batch [1920/2000] time 2.057 (3.008) data 0.000 (0.001) loss 2.9379 (1.2319) lr 1.9298e-03 eta 2 days, 15:33:59
epoch [12/50] batch [1940/2000] time 2.061 (2.998) data 0.000 (0.001) loss 0.5689 (1.2288) lr 1.9298e-03 eta 2 days, 15:20:25
epoch [12/50] batch [1960/2000] time 2.057 (2.988) data 0.000 (0.001) loss 0.1860 (1.2263) lr 1.9298e-03 eta 2 days, 15:07:02
epoch [12/50] batch [1980/2000] time 2.064 (2.979) data 0.000 (0.001) loss 0.6707 (1.2308) lr 1.9298e-03 eta 2 days, 14:53:49
epoch [12/50] batch [2000/2000] time 2.034 (2.969) data 0.000 (0.001) loss 1.1407 (1.2273) lr 1.9048e-03 eta 2 days, 14:40:51
epoch [13/50] batch [20/2000] time 2.011 (2.082) data 0.001 (0.035) loss 1.1313 (1.3425) lr 1.9048e-03 eta 1 day, 19:56:27
epoch [13/50] batch [40/2000] time 2.061 (2.061) data 0.000 (0.018) loss 0.5082 (1.3282) lr 1.9048e-03 eta 1 day, 19:29:18
epoch [13/50] batch [60/2000] time 2.060 (2.054) data 0.000 (0.012) loss 0.2639 (1.2535) lr 1.9048e-03 eta 1 day, 19:19:05
epoch [13/50] batch [80/2000] time 2.042 (2.049) data 0.000 (0.009) loss 0.0965 (1.2054) lr 1.9048e-03 eta 1 day, 19:13:09
epoch [13/50] batch [100/2000] time 2.057 (2.049) data 0.000 (0.007) loss 1.0308 (1.2629) lr 1.9048e-03 eta 1 day, 19:12:02
epoch [13/50] batch [120/2000] time 2.036 (2.046) data 0.000 (0.006) loss 0.1769 (1.2268) lr 1.9048e-03 eta 1 day, 19:07:27
epoch [13/50] batch [140/2000] time 2.040 (2.045) data 0.000 (0.005) loss 2.2041 (1.2531) lr 1.9048e-03 eta 1 day, 19:05:59
epoch [13/50] batch [160/2000] time 2.006 (2.046) data 0.000 (0.005) loss 0.2971 (1.2324) lr 1.9048e-03 eta 1 day, 19:05:52
epoch [13/50] batch [180/2000] time 2.070 (2.045) data 0.000 (0.004) loss 0.3245 (1.2364) lr 1.9048e-03 eta 1 day, 19:03:45
epoch [13/50] batch [200/2000] time 2.010 (2.044) data 0.000 (0.004) loss 2.2994 (1.2439) lr 1.9048e-03 eta 1 day, 19:02:23
epoch [13/50] batch [220/2000] time 2.035 (2.044) data 0.000 (0.003) loss 2.1830 (1.2471) lr 1.9048e-03 eta 1 day, 19:01:56
epoch [13/50] batch [240/2000] time 2.064 (2.044) data 0.000 (0.003) loss 1.2491 (1.2073) lr 1.9048e-03 eta 1 day, 19:00:56
epoch [13/50] batch [260/2000] time 2.062 (2.044) data 0.000 (0.003) loss 0.3741 (1.1884) lr 1.9048e-03 eta 1 day, 19:00:14
epoch [13/50] batch [280/2000] time 2.075 (2.044) data 0.000 (0.003) loss 1.8412 (1.1665) lr 1.9048e-03 eta 1 day, 18:59:13
epoch [13/50] batch [300/2000] time 2.060 (2.044) data 0.000 (0.003) loss 0.0803 (1.1955) lr 1.9048e-03 eta 1 day, 18:59:03
epoch [13/50] batch [320/2000] time 2.059 (2.044) data 0.000 (0.002) loss 0.4652 (1.1908) lr 1.9048e-03 eta 1 day, 18:58:22
epoch [13/50] batch [340/2000] time 2.043 (2.044) data 0.000 (0.002) loss 1.3564 (1.1929) lr 1.9048e-03 eta 1 day, 18:56:55
epoch [13/50] batch [360/2000] time 2.055 (2.043) data 0.000 (0.002) loss 1.1932 (1.2085) lr 1.9048e-03 eta 1 day, 18:55:25
epoch [13/50] batch [380/2000] time 2.056 (2.042) data 0.000 (0.002) loss 0.7994 (1.2057) lr 1.9048e-03 eta 1 day, 18:53:57
epoch [13/50] batch [400/2000] time 2.005 (2.042) data 0.000 (0.002) loss 4.0141 (1.2201) lr 1.9048e-03 eta 1 day, 18:52:52
epoch [13/50] batch [420/2000] time 2.004 (2.042) data 0.000 (0.002) loss 0.3469 (1.2249) lr 1.9048e-03 eta 1 day, 18:51:51
epoch [13/50] batch [440/2000] time 2.006 (2.041) data 0.000 (0.002) loss 1.8547 (1.2397) lr 1.9048e-03 eta 1 day, 18:50:23
epoch [13/50] batch [460/2000] time 1.983 (2.041) data 0.000 (0.002) loss 0.8497 (1.2343) lr 1.9048e-03 eta 1 day, 18:49:02
epoch [13/50] batch [480/2000] time 2.060 (2.040) data 0.000 (0.002) loss 2.3575 (1.2362) lr 1.9048e-03 eta 1 day, 18:48:15
epoch [13/50] batch [500/2000] time 2.006 (2.041) data 0.000 (0.002) loss 0.8496 (1.2348) lr 1.9048e-03 eta 1 day, 18:47:42
epoch [13/50] batch [520/2000] time 2.057 (2.040) data 0.000 (0.002) loss 1.0854 (1.2339) lr 1.9048e-03 eta 1 day, 18:46:54
epoch [13/50] batch [540/2000] time 2.057 (2.041) data 0.000 (0.002) loss 1.3041 (1.2372) lr 1.9048e-03 eta 1 day, 18:46:21
epoch [13/50] batch [560/2000] time 2.064 (2.041) data 0.000 (0.002) loss 3.9987 (1.2533) lr 1.9048e-03 eta 1 day, 18:45:52
epoch [13/50] batch [580/2000] time 2.051 (2.041) data 0.000 (0.002) loss 0.2600 (1.2501) lr 1.9048e-03 eta 1 day, 18:45:14
epoch [13/50] batch [600/2000] time 2.080 (2.041) data 0.001 (0.001) loss 1.3202 (1.2443) lr 1.9048e-03 eta 1 day, 18:44:47
epoch [13/50] batch [620/2000] time 2.015 (2.041) data 0.001 (0.001) loss 3.4549 (1.2574) lr 1.9048e-03 eta 1 day, 18:44:36
epoch [13/50] batch [640/2000] time 2.013 (2.042) data 0.000 (0.001) loss 1.5745 (1.2647) lr 1.9048e-03 eta 1 day, 18:44:21
epoch [13/50] batch [660/2000] time 2.049 (2.042) data 0.000 (0.001) loss 4.1614 (1.2638) lr 1.9048e-03 eta 1 day, 18:43:37
epoch [13/50] batch [680/2000] time 2.046 (2.042) data 0.000 (0.001) loss 2.0396 (1.2629) lr 1.9048e-03 eta 1 day, 18:43:30
epoch [13/50] batch [700/2000] time 2.019 (2.042) data 0.000 (0.001) loss 0.3561 (1.2560) lr 1.9048e-03 eta 1 day, 18:43:09
epoch [13/50] batch [720/2000] time 2.017 (2.043) data 0.000 (0.001) loss 0.8982 (1.2443) lr 1.9048e-03 eta 1 day, 18:42:46
epoch [13/50] batch [740/2000] time 2.015 (2.043) data 0.000 (0.001) loss 0.1333 (1.2426) lr 1.9048e-03 eta 1 day, 18:42:20
epoch [13/50] batch [760/2000] time 2.043 (2.043) data 0.000 (0.001) loss 2.4393 (1.2518) lr 1.9048e-03 eta 1 day, 18:41:48
epoch [13/50] batch [780/2000] time 2.063 (2.043) data 0.000 (0.001) loss 0.4475 (1.2474) lr 1.9048e-03 eta 1 day, 18:41:18
epoch [13/50] batch [800/2000] time 2.054 (2.043) data 0.000 (0.001) loss 0.5561 (1.2516) lr 1.9048e-03 eta 1 day, 18:40:39
epoch [13/50] batch [820/2000] time 2.063 (2.043) data 0.000 (0.001) loss 0.6259 (1.2491) lr 1.9048e-03 eta 1 day, 18:40:01
epoch [13/50] batch [840/2000] time 1.986 (2.043) data 0.000 (0.001) loss 2.0417 (1.2499) lr 1.9048e-03 eta 1 day, 18:39:27
epoch [13/50] batch [860/2000] time 2.062 (2.043) data 0.000 (0.001) loss 1.3247 (1.2488) lr 1.9048e-03 eta 1 day, 18:38:54
epoch [13/50] batch [880/2000] time 2.063 (2.043) data 0.000 (0.001) loss 0.5158 (1.2422) lr 1.9048e-03 eta 1 day, 18:38:05
epoch [13/50] batch [900/2000] time 1.987 (2.043) data 0.000 (0.001) loss 0.8014 (1.2387) lr 1.9048e-03 eta 1 day, 18:37:22
epoch [13/50] batch [920/2000] time 2.061 (2.043) data 0.000 (0.001) loss 1.9414 (1.2422) lr 1.9048e-03 eta 1 day, 18:36:46
epoch [13/50] batch [940/2000] time 2.009 (2.043) data 0.000 (0.001) loss 0.1625 (1.2426) lr 1.9048e-03 eta 1 day, 18:35:56
epoch [13/50] batch [960/2000] time 2.047 (2.043) data 0.000 (0.001) loss 2.2367 (1.2396) lr 1.9048e-03 eta 1 day, 18:35:24
epoch [13/50] batch [980/2000] time 2.043 (2.043) data 0.000 (0.001) loss 0.7961 (1.2372) lr 1.9048e-03 eta 1 day, 18:34:38
epoch [13/50] batch [1000/2000] time 2.066 (2.043) data 0.000 (0.001) loss 1.6263 (1.2400) lr 1.9048e-03 eta 1 day, 18:33:47
epoch [13/50] batch [1020/2000] time 2.010 (2.043) data 0.000 (0.001) loss 1.1852 (1.2362) lr 1.9048e-03 eta 1 day, 18:33:04
epoch [13/50] batch [1040/2000] time 2.017 (2.043) data 0.000 (0.001) loss 2.1876 (1.2313) lr 1.9048e-03 eta 1 day, 18:32:22
epoch [13/50] batch [1060/2000] time 2.070 (2.043) data 0.000 (0.001) loss 0.6814 (1.2341) lr 1.9048e-03 eta 1 day, 18:31:50
epoch [13/50] batch [1080/2000] time 2.016 (2.043) data 0.000 (0.001) loss 2.6026 (1.2306) lr 1.9048e-03 eta 1 day, 18:31:07
epoch [13/50] batch [1100/2000] time 2.068 (2.043) data 0.000 (0.001) loss 1.4391 (1.2357) lr 1.9048e-03 eta 1 day, 18:30:26
epoch [13/50] batch [1120/2000] time 2.069 (2.043) data 0.000 (0.001) loss 0.1931 (1.2328) lr 1.9048e-03 eta 1 day, 18:29:41
epoch [13/50] batch [1140/2000] time 2.039 (2.043) data 0.001 (0.001) loss 1.4843 (1.2302) lr 1.9048e-03 eta 1 day, 18:28:58
epoch [13/50] batch [1160/2000] time 2.060 (2.043) data 0.000 (0.001) loss 0.4099 (1.2303) lr 1.9048e-03 eta 1 day, 18:28:18
epoch [13/50] batch [1180/2000] time 2.040 (2.043) data 0.000 (0.001) loss 0.5671 (1.2344) lr 1.9048e-03 eta 1 day, 18:27:34
epoch [13/50] batch [1200/2000] time 2.042 (2.043) data 0.000 (0.001) loss 1.4770 (1.2364) lr 1.9048e-03 eta 1 day, 18:26:52
epoch [13/50] batch [1220/2000] time 2.021 (2.043) data 0.001 (0.001) loss 1.1915 (1.2373) lr 1.9048e-03 eta 1 day, 18:26:24
epoch [13/50] batch [1240/2000] time 2.064 (2.043) data 0.000 (0.001) loss 1.8942 (1.2339) lr 1.9048e-03 eta 1 day, 18:25:47
epoch [13/50] batch [1260/2000] time 2.064 (2.043) data 0.000 (0.001) loss 0.5777 (1.2292) lr 1.9048e-03 eta 1 day, 18:25:06
epoch [13/50] batch [1280/2000] time 2.021 (2.043) data 0.000 (0.001) loss 0.6637 (1.2324) lr 1.9048e-03 eta 1 day, 18:24:20
epoch [13/50] batch [1300/2000] time 2.039 (2.043) data 0.000 (0.001) loss 1.3987 (1.2350) lr 1.9048e-03 eta 1 day, 18:23:33
epoch [13/50] batch [1320/2000] time 2.038 (2.043) data 0.000 (0.001) loss 0.1187 (1.2405) lr 1.9048e-03 eta 1 day, 18:22:51
epoch [13/50] batch [1340/2000] time 2.036 (2.043) data 0.000 (0.001) loss 0.3322 (1.2423) lr 1.9048e-03 eta 1 day, 18:22:17
epoch [13/50] batch [1360/2000] time 2.031 (2.043) data 0.000 (0.001) loss 0.6751 (1.2411) lr 1.9048e-03 eta 1 day, 18:21:34
epoch [13/50] batch [1380/2000] time 2.039 (2.043) data 0.000 (0.001) loss 1.2864 (1.2383) lr 1.9048e-03 eta 1 day, 18:20:53
epoch [13/50] batch [1400/2000] time 2.061 (2.043) data 0.000 (0.001) loss 1.7127 (1.2372) lr 1.9048e-03 eta 1 day, 18:20:05
epoch [13/50] batch [1420/2000] time 2.074 (2.043) data 0.007 (0.001) loss 0.5132 (1.2361) lr 1.9048e-03 eta 1 day, 18:19:23
epoch [13/50] batch [1440/2000] time 1.984 (2.043) data 0.000 (0.001) loss 0.4652 (1.2352) lr 1.9048e-03 eta 1 day, 18:18:43
epoch [13/50] batch [1460/2000] time 2.058 (2.043) data 0.000 (0.001) loss 1.6530 (1.2320) lr 1.9048e-03 eta 1 day, 18:17:57
epoch [13/50] batch [1480/2000] time 2.033 (2.043) data 0.000 (0.001) loss 0.2069 (1.2321) lr 1.9048e-03 eta 1 day, 18:17:14
epoch [13/50] batch [1500/2000] time 2.056 (2.043) data 0.000 (0.001) loss 0.2002 (1.2309) lr 1.9048e-03 eta 1 day, 18:16:31
epoch [13/50] batch [1520/2000] time 2.005 (2.043) data 0.000 (0.001) loss 0.8306 (1.2288) lr 1.9048e-03 eta 1 day, 18:15:41
epoch [13/50] batch [1540/2000] time 2.037 (2.043) data 0.000 (0.001) loss 1.7182 (1.2280) lr 1.9048e-03 eta 1 day, 18:14:58
epoch [13/50] batch [1560/2000] time 2.057 (2.043) data 0.000 (0.001) loss 1.6517 (1.2315) lr 1.9048e-03 eta 1 day, 18:14:14
epoch [13/50] batch [1580/2000] time 2.040 (2.043) data 0.000 (0.001) loss 1.0300 (1.2289) lr 1.9048e-03 eta 1 day, 18:13:27
epoch [13/50] batch [1600/2000] time 1.990 (2.042) data 0.000 (0.001) loss 2.3928 (1.2271) lr 1.9048e-03 eta 1 day, 18:12:37
epoch [13/50] batch [1620/2000] time 2.079 (2.042) data 0.000 (0.001) loss 1.1604 (1.2268) lr 1.9048e-03 eta 1 day, 18:11:53
epoch [13/50] batch [1640/2000] time 2.068 (2.042) data 0.000 (0.001) loss 0.9686 (1.2228) lr 1.9048e-03 eta 1 day, 18:11:18
epoch [13/50] batch [1660/2000] time 2.068 (2.043) data 0.000 (0.001) loss 1.1295 (1.2271) lr 1.9048e-03 eta 1 day, 18:10:48
epoch [13/50] batch [1680/2000] time 2.049 (2.043) data 0.001 (0.001) loss 1.5988 (1.2262) lr 1.9048e-03 eta 1 day, 18:10:17
epoch [13/50] batch [1700/2000] time 2.044 (2.043) data 0.000 (0.001) loss 2.7169 (1.2268) lr 1.9048e-03 eta 1 day, 18:09:43
epoch [13/50] batch [1720/2000] time 2.009 (2.043) data 0.000 (0.001) loss 1.4212 (1.2283) lr 1.9048e-03 eta 1 day, 18:09:02
epoch [13/50] batch [1740/2000] time 2.008 (2.043) data 0.000 (0.001) loss 2.2956 (1.2257) lr 1.9048e-03 eta 1 day, 18:08:18
epoch [13/50] batch [1760/2000] time 2.036 (2.043) data 0.000 (0.001) loss 1.2779 (1.2275) lr 1.9048e-03 eta 1 day, 18:07:35
epoch [13/50] batch [1780/2000] time 2.040 (2.043) data 0.000 (0.001) loss 0.2497 (1.2280) lr 1.9048e-03 eta 1 day, 18:06:52
epoch [13/50] batch [1800/2000] time 2.018 (2.043) data 0.000 (0.001) loss 0.6456 (1.2288) lr 1.9048e-03 eta 1 day, 18:06:14
epoch [13/50] batch [1820/2000] time 2.070 (2.043) data 0.000 (0.001) loss 1.2117 (1.2265) lr 1.9048e-03 eta 1 day, 18:05:35
epoch [13/50] batch [1840/2000] time 2.061 (2.043) data 0.000 (0.001) loss 0.9519 (1.2273) lr 1.9048e-03 eta 1 day, 18:04:51
epoch [13/50] batch [1860/2000] time 2.065 (2.043) data 0.001 (0.001) loss 0.4274 (1.2240) lr 1.9048e-03 eta 1 day, 18:04:07
epoch [13/50] batch [1880/2000] time 2.044 (2.043) data 0.000 (0.001) loss 2.4969 (1.2226) lr 1.9048e-03 eta 1 day, 18:03:20
epoch [13/50] batch [1900/2000] time 2.063 (2.043) data 0.000 (0.001) loss 0.6607 (1.2233) lr 1.9048e-03 eta 1 day, 18:02:37
epoch [13/50] batch [1920/2000] time 2.052 (2.043) data 0.000 (0.001) loss 0.4123 (1.2229) lr 1.9048e-03 eta 1 day, 18:01:56
epoch [13/50] batch [1940/2000] time 2.040 (2.043) data 0.000 (0.001) loss 0.1359 (1.2238) lr 1.9048e-03 eta 1 day, 18:01:12
epoch [13/50] batch [1960/2000] time 2.073 (2.043) data 0.000 (0.001) loss 1.2432 (1.2210) lr 1.9048e-03 eta 1 day, 18:00:30
epoch [13/50] batch [1980/2000] time 2.017 (2.042) data 0.000 (0.001) loss 0.6102 (1.2213) lr 1.9048e-03 eta 1 day, 17:59:38
epoch [13/50] batch [2000/2000] time 2.061 (2.042) data 0.000 (0.001) loss 1.7216 (1.2204) lr 1.8763e-03 eta 1 day, 17:58:59
epoch [14/50] batch [20/2000] time 2.066 (2.074) data 0.000 (0.029) loss 0.5181 (1.2155) lr 1.8763e-03 eta 1 day, 18:36:48
epoch [14/50] batch [40/2000] time 1.984 (2.064) data 0.000 (0.015) loss 0.0650 (1.0473) lr 1.8763e-03 eta 1 day, 18:24:37
epoch [14/50] batch [60/2000] time 2.010 (2.059) data 0.001 (0.010) loss 1.9485 (1.0222) lr 1.8763e-03 eta 1 day, 18:16:56
epoch [14/50] batch [80/2000] time 1.988 (2.056) data 0.000 (0.008) loss 1.3233 (1.0894) lr 1.8763e-03 eta 1 day, 18:13:02
epoch [14/50] batch [100/2000] time 2.009 (2.053) data 0.000 (0.006) loss 0.1372 (1.1183) lr 1.8763e-03 eta 1 day, 18:09:13
epoch [14/50] batch [120/2000] time 2.068 (2.053) data 0.000 (0.005) loss 0.4461 (1.1222) lr 1.8763e-03 eta 1 day, 18:07:34
epoch [14/50] batch [140/2000] time 2.007 (2.051) data 0.000 (0.005) loss 1.7202 (1.1600) lr 1.8763e-03 eta 1 day, 18:04:13
epoch [14/50] batch [160/2000] time 2.067 (2.050) data 0.000 (0.004) loss 2.4346 (1.2080) lr 1.8763e-03 eta 1 day, 18:02:43
epoch [14/50] batch [180/2000] time 2.078 (2.050) data 0.000 (0.004) loss 1.6871 (1.1788) lr 1.8763e-03 eta 1 day, 18:01:42
epoch [14/50] batch [200/2000] time 1.992 (2.049) data 0.000 (0.003) loss 0.3614 (1.1618) lr 1.8763e-03 eta 1 day, 18:00:38
epoch [14/50] batch [220/2000] time 2.068 (2.049) data 0.000 (0.003) loss 0.7485 (1.1599) lr 1.8763e-03 eta 1 day, 17:59:47
epoch [14/50] batch [240/2000] time 2.073 (2.049) data 0.000 (0.003) loss 0.4593 (1.1466) lr 1.8763e-03 eta 1 day, 17:58:52
epoch [14/50] batch [260/2000] time 2.020 (2.050) data 0.000 (0.003) loss 1.4607 (1.1590) lr 1.8763e-03 eta 1 day, 17:58:51
epoch [14/50] batch [280/2000] time 2.068 (2.049) data 0.000 (0.003) loss 2.6616 (1.1597) lr 1.8763e-03 eta 1 day, 17:57:50
epoch [14/50] batch [300/2000] time 2.072 (2.049) data 0.000 (0.002) loss 0.4731 (1.1860) lr 1.8763e-03 eta 1 day, 17:57:16
epoch [14/50] batch [320/2000] time 2.068 (2.049) data 0.000 (0.002) loss 0.0992 (1.1706) lr 1.8763e-03 eta 1 day, 17:56:42
epoch [14/50] batch [340/2000] time 2.053 (2.050) data 0.000 (0.002) loss 2.5911 (1.1743) lr 1.8763e-03 eta 1 day, 17:56:58
epoch [14/50] batch [360/2000] time 2.010 (2.051) data 0.000 (0.002) loss 0.9605 (1.1796) lr 1.8763e-03 eta 1 day, 17:57:34
epoch [14/50] batch [380/2000] time 2.060 (2.051) data 0.000 (0.002) loss 2.2309 (1.1723) lr 1.8763e-03 eta 1 day, 17:56:46
epoch [14/50] batch [400/2000] time 2.008 (2.051) data 0.000 (0.002) loss 0.2468 (1.1697) lr 1.8763e-03 eta 1 day, 17:55:33
epoch [14/50] batch [420/2000] time 2.060 (2.051) data 0.000 (0.002) loss 2.3304 (1.1785) lr 1.8763e-03 eta 1 day, 17:54:52
epoch [14/50] batch [440/2000] time 2.061 (2.050) data 0.000 (0.002) loss 1.1169 (1.1664) lr 1.8763e-03 eta 1 day, 17:53:24
epoch [14/50] batch [460/2000] time 2.047 (2.050) data 0.000 (0.002) loss 1.2125 (1.1647) lr 1.8763e-03 eta 1 day, 17:52:17
epoch [14/50] batch [480/2000] time 1.983 (2.049) data 0.000 (0.002) loss 0.4131 (1.1656) lr 1.8763e-03 eta 1 day, 17:50:54
epoch [14/50] batch [500/2000] time 2.011 (2.049) data 0.000 (0.002) loss 1.6614 (1.1706) lr 1.8763e-03 eta 1 day, 17:50:04
epoch [14/50] batch [520/2000] time 2.062 (2.049) data 0.000 (0.002) loss 1.4038 (1.1658) lr 1.8763e-03 eta 1 day, 17:49:10
epoch [14/50] batch [540/2000] time 2.011 (2.049) data 0.000 (0.001) loss 1.4176 (1.1656) lr 1.8763e-03 eta 1 day, 17:48:35
epoch [14/50] batch [560/2000] time 2.063 (2.049) data 0.000 (0.001) loss 1.2314 (1.1618) lr 1.8763e-03 eta 1 day, 17:47:33
epoch [14/50] batch [580/2000] time 2.034 (2.048) data 0.000 (0.001) loss 2.0325 (1.1728) lr 1.8763e-03 eta 1 day, 17:46:37
epoch [14/50] batch [600/2000] time 2.039 (2.048) data 0.001 (0.001) loss 0.1274 (1.1717) lr 1.8763e-03 eta 1 day, 17:45:58
epoch [14/50] batch [620/2000] time 2.008 (2.048) data 0.000 (0.001) loss 1.4467 (1.1766) lr 1.8763e-03 eta 1 day, 17:44:53
epoch [14/50] batch [640/2000] time 2.039 (2.048) data 0.000 (0.001) loss 0.2884 (1.1730) lr 1.8763e-03 eta 1 day, 17:44:13
epoch [14/50] batch [660/2000] time 2.061 (2.048) data 0.000 (0.001) loss 0.4449 (1.1709) lr 1.8763e-03 eta 1 day, 17:43:25
epoch [14/50] batch [680/2000] time 1.986 (2.048) data 0.000 (0.001) loss 1.6667 (1.1687) lr 1.8763e-03 eta 1 day, 17:42:25
epoch [14/50] batch [700/2000] time 2.013 (2.048) data 0.000 (0.001) loss 0.6601 (1.1756) lr 1.8763e-03 eta 1 day, 17:41:32
epoch [14/50] batch [720/2000] time 2.010 (2.047) data 0.000 (0.001) loss 0.8090 (1.1850) lr 1.8763e-03 eta 1 day, 17:40:38
epoch [14/50] batch [740/2000] time 2.012 (2.048) data 0.000 (0.001) loss 0.2463 (1.1925) lr 1.8763e-03 eta 1 day, 17:40:01
epoch [14/50] batch [760/2000] time 2.059 (2.048) data 0.000 (0.001) loss 1.6505 (1.1967) lr 1.8763e-03 eta 1 day, 17:39:31
epoch [14/50] batch [780/2000] time 2.018 (2.047) data 0.000 (0.001) loss 2.6207 (1.1952) lr 1.8763e-03 eta 1 day, 17:38:28
epoch [14/50] batch [800/2000] time 2.051 (2.047) data 0.000 (0.001) loss 0.9469 (1.1957) lr 1.8763e-03 eta 1 day, 17:37:51
epoch [14/50] batch [820/2000] time 2.048 (2.047) data 0.000 (0.001) loss 0.8706 (1.1900) lr 1.8763e-03 eta 1 day, 17:37:13
epoch [14/50] batch [840/2000] time 2.064 (2.047) data 0.000 (0.001) loss 1.9448 (1.1876) lr 1.8763e-03 eta 1 day, 17:36:22
epoch [14/50] batch [860/2000] time 2.065 (2.047) data 0.000 (0.001) loss 1.4486 (1.1962) lr 1.8763e-03 eta 1 day, 17:35:36
epoch [14/50] batch [880/2000] time 2.042 (2.047) data 0.000 (0.001) loss 1.9840 (1.2022) lr 1.8763e-03 eta 1 day, 17:34:50
epoch [14/50] batch [900/2000] time 2.064 (2.047) data 0.000 (0.001) loss 1.3657 (1.2060) lr 1.8763e-03 eta 1 day, 17:34:10
epoch [14/50] batch [920/2000] time 2.079 (2.047) data 0.000 (0.001) loss 0.8264 (1.2086) lr 1.8763e-03 eta 1 day, 17:33:22
epoch [14/50] batch [940/2000] time 2.059 (2.047) data 0.000 (0.001) loss 1.0299 (1.1994) lr 1.8763e-03 eta 1 day, 17:32:41
epoch [14/50] batch [960/2000] time 2.061 (2.047) data 0.000 (0.001) loss 0.0774 (1.1986) lr 1.8763e-03 eta 1 day, 17:31:52
epoch [14/50] batch [980/2000] time 2.050 (2.047) data 0.000 (0.001) loss 1.2751 (1.2061) lr 1.8763e-03 eta 1 day, 17:31:07
epoch [14/50] batch [1000/2000] time 2.023 (2.047) data 0.000 (0.001) loss 2.5661 (1.2059) lr 1.8763e-03 eta 1 day, 17:30:28
epoch [14/50] batch [1020/2000] time 2.021 (2.047) data 0.000 (0.001) loss 1.3007 (1.2024) lr 1.8763e-03 eta 1 day, 17:29:38
epoch [14/50] batch [1040/2000] time 2.069 (2.047) data 0.000 (0.001) loss 2.5903 (1.2041) lr 1.8763e-03 eta 1 day, 17:28:56
epoch [14/50] batch [1060/2000] time 2.047 (2.047) data 0.001 (0.001) loss 0.8097 (1.2063) lr 1.8763e-03 eta 1 day, 17:28:37
epoch [14/50] batch [1080/2000] time 2.009 (2.047) data 0.000 (0.001) loss 1.3625 (1.2063) lr 1.8763e-03 eta 1 day, 17:27:53
epoch [14/50] batch [1100/2000] time 2.050 (2.047) data 0.000 (0.001) loss 0.8853 (1.2090) lr 1.8763e-03 eta 1 day, 17:27:08
epoch [14/50] batch [1120/2000] time 2.011 (2.047) data 0.000 (0.001) loss 0.6907 (1.2101) lr 1.8763e-03 eta 1 day, 17:26:26
epoch [14/50] batch [1140/2000] time 2.071 (2.047) data 0.001 (0.001) loss 0.8747 (1.2102) lr 1.8763e-03 eta 1 day, 17:25:34
epoch [14/50] batch [1160/2000] time 2.139 (2.047) data 0.000 (0.001) loss 0.1813 (1.2047) lr 1.8763e-03 eta 1 day, 17:24:51
epoch [14/50] batch [1180/2000] time 2.041 (2.047) data 0.000 (0.001) loss 1.5239 (1.2087) lr 1.8763e-03 eta 1 day, 17:24:10
epoch [14/50] batch [1200/2000] time 2.011 (2.047) data 0.000 (0.001) loss 0.2460 (1.2105) lr 1.8763e-03 eta 1 day, 17:23:30
epoch [14/50] batch [1220/2000] time 2.046 (2.047) data 0.000 (0.001) loss 2.7708 (1.2139) lr 1.8763e-03 eta 1 day, 17:23:24
epoch [14/50] batch [1240/2000] time 2.010 (2.047) data 0.000 (0.001) loss 3.9699 (1.2259) lr 1.8763e-03 eta 1 day, 17:22:45
epoch [14/50] batch [1260/2000] time 2.076 (2.047) data 0.000 (0.001) loss 0.2703 (1.2256) lr 1.8763e-03 eta 1 day, 17:22:00
epoch [14/50] batch [1280/2000] time 2.075 (2.047) data 0.000 (0.001) loss 1.1240 (1.2216) lr 1.8763e-03 eta 1 day, 17:21:26
epoch [14/50] batch [1300/2000] time 2.067 (2.047) data 0.000 (0.001) loss 1.0465 (1.2215) lr 1.8763e-03 eta 1 day, 17:20:50
epoch [14/50] batch [1320/2000] time 2.065 (2.047) data 0.000 (0.001) loss 0.1036 (1.2197) lr 1.8763e-03 eta 1 day, 17:20:09
epoch [14/50] batch [1340/2000] time 1.987 (2.047) data 0.000 (0.001) loss 0.2354 (1.2210) lr 1.8763e-03 eta 1 day, 17:19:20
epoch [14/50] batch [1360/2000] time 2.069 (2.047) data 0.000 (0.001) loss 0.2211 (1.2170) lr 1.8763e-03 eta 1 day, 17:18:47
epoch [14/50] batch [1380/2000] time 2.060 (2.047) data 0.000 (0.001) loss 0.7054 (1.2177) lr 1.8763e-03 eta 1 day, 17:17:57
epoch [14/50] batch [1400/2000] time 2.006 (2.047) data 0.000 (0.001) loss 0.3287 (1.2181) lr 1.8763e-03 eta 1 day, 17:17:09
epoch [14/50] batch [1420/2000] time 2.008 (2.047) data 0.000 (0.001) loss 0.4197 (1.2145) lr 1.8763e-03 eta 1 day, 17:16:31
epoch [14/50] batch [1440/2000] time 2.046 (2.047) data 0.000 (0.001) loss 3.3957 (1.2188) lr 1.8763e-03 eta 1 day, 17:16:06
epoch [14/50] batch [1460/2000] time 2.044 (2.048) data 0.000 (0.001) loss 2.5237 (1.2191) lr 1.8763e-03 eta 1 day, 17:15:26
epoch [14/50] batch [1480/2000] time 2.009 (2.047) data 0.000 (0.001) loss 1.9417 (1.2174) lr 1.8763e-03 eta 1 day, 17:14:36
epoch [14/50] batch [1500/2000] time 2.066 (2.047) data 0.000 (0.001) loss 1.6422 (1.2175) lr 1.8763e-03 eta 1 day, 17:13:59
epoch [14/50] batch [1520/2000] time 2.062 (2.047) data 0.000 (0.001) loss 0.9149 (1.2203) lr 1.8763e-03 eta 1 day, 17:13:08
epoch [14/50] batch [1540/2000] time 2.059 (2.047) data 0.000 (0.001) loss 0.4539 (1.2251) lr 1.8763e-03 eta 1 day, 17:12:19
epoch [14/50] batch [1560/2000] time 1.990 (2.047) data 0.000 (0.001) loss 0.8261 (1.2231) lr 1.8763e-03 eta 1 day, 17:11:25
epoch [14/50] batch [1580/2000] time 2.060 (2.047) data 0.000 (0.001) loss 0.9659 (1.2232) lr 1.8763e-03 eta 1 day, 17:10:33
epoch [14/50] batch [1600/2000] time 2.062 (2.047) data 0.000 (0.001) loss 1.2871 (1.2230) lr 1.8763e-03 eta 1 day, 17:09:42
epoch [14/50] batch [1620/2000] time 2.073 (2.047) data 0.000 (0.001) loss 0.4907 (1.2257) lr 1.8763e-03 eta 1 day, 17:08:57
epoch [14/50] batch [1640/2000] time 2.066 (2.047) data 0.000 (0.001) loss 1.8645 (1.2294) lr 1.8763e-03 eta 1 day, 17:08:09
epoch [14/50] batch [1660/2000] time 2.068 (2.047) data 0.000 (0.001) loss 0.4147 (1.2303) lr 1.8763e-03 eta 1 day, 17:07:30
epoch [14/50] batch [1680/2000] time 2.061 (2.047) data 0.001 (0.001) loss 1.6145 (1.2308) lr 1.8763e-03 eta 1 day, 17:06:43
epoch [14/50] batch [1700/2000] time 2.062 (2.046) data 0.000 (0.001) loss 2.0538 (1.2342) lr 1.8763e-03 eta 1 day, 17:05:56
epoch [14/50] batch [1720/2000] time 2.066 (2.046) data 0.000 (0.001) loss 1.1965 (1.2331) lr 1.8763e-03 eta 1 day, 17:05:15
epoch [14/50] batch [1740/2000] time 2.062 (2.046) data 0.000 (0.001) loss 1.2225 (1.2336) lr 1.8763e-03 eta 1 day, 17:04:29
epoch [14/50] batch [1760/2000] time 2.071 (2.046) data 0.000 (0.001) loss 0.7550 (1.2313) lr 1.8763e-03 eta 1 day, 17:03:46
epoch [14/50] batch [1780/2000] time 2.077 (2.046) data 0.000 (0.001) loss 0.5097 (1.2324) lr 1.8763e-03 eta 1 day, 17:03:05
epoch [14/50] batch [1800/2000] time 2.048 (2.046) data 0.000 (0.001) loss 1.3473 (1.2330) lr 1.8763e-03 eta 1 day, 17:02:25
epoch [14/50] batch [1820/2000] time 2.070 (2.046) data 0.001 (0.001) loss 0.9989 (1.2314) lr 1.8763e-03 eta 1 day, 17:01:51
epoch [14/50] batch [1840/2000] time 2.038 (2.046) data 0.000 (0.001) loss 0.2018 (1.2311) lr 1.8763e-03 eta 1 day, 17:01:04
epoch [14/50] batch [1860/2000] time 2.012 (2.046) data 0.000 (0.001) loss 0.1401 (1.2295) lr 1.8763e-03 eta 1 day, 17:00:17
epoch [14/50] batch [1880/2000] time 2.034 (2.046) data 0.000 (0.001) loss 0.2046 (1.2328) lr 1.8763e-03 eta 1 day, 16:59:37
epoch [14/50] batch [1900/2000] time 2.060 (2.046) data 0.000 (0.001) loss 2.7185 (1.2350) lr 1.8763e-03 eta 1 day, 16:58:55
epoch [14/50] batch [1920/2000] time 2.058 (2.046) data 0.000 (0.001) loss 0.1576 (1.2346) lr 1.8763e-03 eta 1 day, 16:58:07
epoch [14/50] batch [1940/2000] time 2.040 (2.046) data 0.000 (0.001) loss 1.1383 (1.2334) lr 1.8763e-03 eta 1 day, 16:57:20
epoch [14/50] batch [1960/2000] time 2.061 (2.046) data 0.000 (0.001) loss 1.2453 (1.2312) lr 1.8763e-03 eta 1 day, 16:56:35
epoch [14/50] batch [1980/2000] time 2.062 (2.046) data 0.000 (0.001) loss 1.3530 (1.2303) lr 1.8763e-03 eta 1 day, 16:55:49
epoch [14/50] batch [2000/2000] time 2.068 (2.046) data 0.000 (0.001) loss 1.6505 (1.2289) lr 1.8443e-03 eta 1 day, 16:55:03
epoch [15/50] batch [20/2000] time 2.018 (2.078) data 0.000 (0.030) loss 0.1710 (1.2278) lr 1.8443e-03 eta 1 day, 17:32:50
epoch [15/50] batch [40/2000] time 2.060 (2.068) data 0.000 (0.015) loss 4.1054 (1.3170) lr 1.8443e-03 eta 1 day, 17:19:39
epoch [15/50] batch [60/2000] time 2.014 (2.063) data 0.001 (0.011) loss 1.5738 (1.1445) lr 1.8443e-03 eta 1 day, 17:13:41
epoch [15/50] batch [80/2000] time 2.036 (2.060) data 0.000 (0.008) loss 1.2106 (1.1988) lr 1.8443e-03 eta 1 day, 17:09:30
epoch [15/50] batch [100/2000] time 2.062 (2.057) data 0.000 (0.007) loss 0.2303 (1.1771) lr 1.8443e-03 eta 1 day, 17:05:25
epoch [15/50] batch [120/2000] time 2.063 (2.055) data 0.000 (0.005) loss 0.0995 (1.1850) lr 1.8443e-03 eta 1 day, 17:02:01
epoch [15/50] batch [140/2000] time 2.070 (2.053) data 0.000 (0.005) loss 0.1009 (1.1892) lr 1.8443e-03 eta 1 day, 16:58:36
epoch [15/50] batch [160/2000] time 2.039 (2.051) data 0.000 (0.004) loss 0.3308 (1.1982) lr 1.8443e-03 eta 1 day, 16:55:43
epoch [15/50] batch [180/2000] time 2.015 (2.049) data 0.000 (0.004) loss 0.9150 (1.2211) lr 1.8443e-03 eta 1 day, 16:53:05
epoch [15/50] batch [200/2000] time 2.067 (2.047) data 0.000 (0.003) loss 0.7792 (1.2166) lr 1.8443e-03 eta 1 day, 16:50:08
epoch [15/50] batch [220/2000] time 2.014 (2.047) data 0.000 (0.003) loss 1.4277 (1.2263) lr 1.8443e-03 eta 1 day, 16:48:20
epoch [15/50] batch [240/2000] time 2.067 (2.046) data 0.000 (0.003) loss 0.9555 (1.2553) lr 1.8443e-03 eta 1 day, 16:47:05
epoch [15/50] batch [260/2000] time 2.066 (2.045) data 0.000 (0.003) loss 0.8389 (1.2499) lr 1.8443e-03 eta 1 day, 16:45:37
epoch [15/50] batch [280/2000] time 2.038 (2.045) data 0.000 (0.002) loss 2.4161 (1.2813) lr 1.8443e-03 eta 1 day, 16:44:42
epoch [15/50] batch [300/2000] time 2.004 (2.045) data 0.000 (0.002) loss 1.2877 (1.3160) lr 1.8443e-03 eta 1 day, 16:43:27
epoch [15/50] batch [320/2000] time 2.007 (2.045) data 0.000 (0.002) loss 3.1321 (1.3150) lr 1.8443e-03 eta 1 day, 16:42:59
epoch [15/50] batch [340/2000] time 2.036 (2.045) data 0.000 (0.002) loss 0.6888 (1.3119) lr 1.8443e-03 eta 1 day, 16:42:07
epoch [15/50] batch [360/2000] time 2.048 (2.045) data 0.000 (0.002) loss 3.2698 (1.3382) lr 1.8443e-03 eta 1 day, 16:41:27
epoch [15/50] batch [380/2000] time 1.990 (2.045) data 0.000 (0.002) loss 0.1256 (1.3513) lr 1.8443e-03 eta 1 day, 16:40:49
epoch [15/50] batch [400/2000] time 2.060 (2.045) data 0.000 (0.002) loss 4.6385 (1.3666) lr 1.8443e-03 eta 1 day, 16:40:25
epoch [15/50] batch [420/2000] time 2.051 (2.044) data 0.000 (0.002) loss 0.9795 (1.3497) lr 1.8443e-03 eta 1 day, 16:38:52
epoch [15/50] batch [440/2000] time 2.009 (2.044) data 0.000 (0.002) loss 1.0628 (1.3338) lr 1.8443e-03 eta 1 day, 16:37:51
epoch [15/50] batch [460/2000] time 2.060 (2.044) data 0.000 (0.002) loss 0.6118 (1.3360) lr 1.8443e-03 eta 1 day, 16:37:22
epoch [15/50] batch [480/2000] time 4.386 (2.084) data 0.000 (0.002) loss 0.2373 (1.3260) lr 1.8443e-03 eta 1 day, 17:23:59
epoch [15/50] batch [500/2000] time 4.338 (2.176) data 0.000 (0.002) loss 2.7542 (1.3280) lr 1.8443e-03 eta 1 day, 19:12:37
epoch [15/50] batch [520/2000] time 4.400 (2.260) data 0.000 (0.002) loss 1.8948 (1.3209) lr 1.8443e-03 eta 1 day, 20:52:46
epoch [15/50] batch [540/2000] time 4.328 (2.339) data 0.000 (0.001) loss 0.7156 (1.3115) lr 1.8443e-03 eta 1 day, 22:25:34
epoch [15/50] batch [560/2000] time 4.390 (2.411) data 0.000 (0.001) loss 5.3763 (1.3120) lr 1.8443e-03 eta 1 day, 23:50:47
epoch [15/50] batch [580/2000] time 4.354 (2.478) data 0.000 (0.001) loss 0.0847 (1.3096) lr 1.8443e-03 eta 2 days, 1:09:59
epoch [15/50] batch [600/2000] time 4.384 (2.541) data 0.001 (0.001) loss 1.3427 (1.3102) lr 1.8443e-03 eta 2 days, 2:24:16
epoch [15/50] batch [620/2000] time 4.375 (2.600) data 0.000 (0.001) loss 2.6311 (1.3224) lr 1.8443e-03 eta 2 days, 3:33:27
epoch [15/50] batch [640/2000] time 4.347 (2.656) data 0.000 (0.001) loss 0.5274 (1.3224) lr 1.8443e-03 eta 2 days, 4:38:23
epoch [15/50] batch [660/2000] time 4.395 (2.708) data 0.000 (0.001) loss 1.5001 (1.3244) lr 1.8443e-03 eta 2 days, 5:39:24
epoch [15/50] batch [680/2000] time 4.355 (2.757) data 0.000 (0.001) loss 1.0760 (1.3131) lr 1.8443e-03 eta 2 days, 6:36:38
epoch [15/50] batch [700/2000] time 4.354 (2.803) data 0.000 (0.001) loss 0.1788 (1.3163) lr 1.8443e-03 eta 2 days, 7:30:19
epoch [15/50] batch [720/2000] time 4.361 (2.846) data 0.000 (0.001) loss 0.0685 (1.3173) lr 1.8443e-03 eta 2 days, 8:21:14
epoch [15/50] batch [740/2000] time 4.385 (2.887) data 0.000 (0.001) loss 2.3097 (1.3217) lr 1.8443e-03 eta 2 days, 9:09:20
epoch [15/50] batch [760/2000] time 4.400 (2.927) data 0.000 (0.001) loss 1.0010 (1.3098) lr 1.8443e-03 eta 2 days, 9:55:08
epoch [15/50] batch [780/2000] time 4.377 (2.964) data 0.000 (0.001) loss 1.1395 (1.3068) lr 1.8443e-03 eta 2 days, 10:38:28
epoch [15/50] batch [800/2000] time 4.402 (3.000) data 0.000 (0.001) loss 0.1692 (1.3074) lr 1.8443e-03 eta 2 days, 11:19:34
epoch [15/50] batch [820/2000] time 4.360 (3.033) data 0.000 (0.001) loss 2.8546 (1.3089) lr 1.8443e-03 eta 2 days, 11:58:22
epoch [15/50] batch [840/2000] time 4.361 (3.065) data 0.000 (0.001) loss 1.2644 (1.2957) lr 1.8443e-03 eta 2 days, 12:35:11
epoch [15/50] batch [860/2000] time 4.425 (3.096) data 0.000 (0.001) loss 0.9493 (1.2990) lr 1.8443e-03 eta 2 days, 13:10:34
epoch [15/50] batch [880/2000] time 4.350 (3.125) data 0.000 (0.001) loss 3.1046 (1.3028) lr 1.8443e-03 eta 2 days, 13:44:06
epoch [15/50] batch [900/2000] time 4.405 (3.153) data 0.000 (0.001) loss 1.8705 (1.2961) lr 1.8443e-03 eta 2 days, 14:16:05
epoch [15/50] batch [920/2000] time 4.394 (3.179) data 0.000 (0.001) loss 0.6379 (1.2894) lr 1.8443e-03 eta 2 days, 14:46:34
epoch [15/50] batch [940/2000] time 4.394 (3.205) data 0.000 (0.001) loss 1.0846 (1.2892) lr 1.8443e-03 eta 2 days, 15:15:53
epoch [15/50] batch [960/2000] time 4.335 (3.229) data 0.000 (0.001) loss 1.2800 (1.2884) lr 1.8443e-03 eta 2 days, 15:43:36
epoch [15/50] batch [980/2000] time 4.380 (3.252) data 0.000 (0.001) loss 1.6874 (1.2915) lr 1.8443e-03 eta 2 days, 16:09:37
epoch [15/50] batch [1000/2000] time 4.381 (3.275) data 0.000 (0.001) loss 1.4552 (1.2896) lr 1.8443e-03 eta 2 days, 16:35:02
epoch [15/50] batch [1020/2000] time 4.385 (3.296) data 0.000 (0.001) loss 0.1415 (1.2808) lr 1.8443e-03 eta 2 days, 16:59:24
epoch [15/50] batch [1040/2000] time 4.370 (3.317) data 0.000 (0.001) loss 0.9104 (1.2760) lr 1.8443e-03 eta 2 days, 17:22:38
epoch [15/50] batch [1060/2000] time 4.405 (3.337) data 0.000 (0.001) loss 0.9362 (1.2731) lr 1.8443e-03 eta 2 days, 17:45:09
epoch [15/50] batch [1080/2000] time 4.372 (3.356) data 0.000 (0.001) loss 0.1750 (1.2719) lr 1.8443e-03 eta 2 days, 18:06:58
epoch [15/50] batch [1100/2000] time 4.397 (3.375) data 0.000 (0.001) loss 1.5265 (1.2719) lr 1.8443e-03 eta 2 days, 18:28:08
epoch [15/50] batch [1120/2000] time 4.370 (3.393) data 0.000 (0.001) loss 0.4038 (1.2649) lr 1.8443e-03 eta 2 days, 18:48:00
epoch [15/50] batch [1140/2000] time 4.369 (3.410) data 0.001 (0.001) loss 0.0787 (1.2600) lr 1.8443e-03 eta 2 days, 19:07:02
epoch [15/50] batch [1160/2000] time 4.341 (3.427) data 0.001 (0.001) loss 0.2171 (1.2577) lr 1.8443e-03 eta 2 days, 19:25:35
epoch [15/50] batch [1180/2000] time 4.406 (3.443) data 0.000 (0.001) loss 1.4423 (1.2555) lr 1.8443e-03 eta 2 days, 19:43:19
epoch [15/50] batch [1200/2000] time 4.403 (3.458) data 0.000 (0.001) loss 1.0141 (1.2635) lr 1.8443e-03 eta 2 days, 20:00:45
epoch [15/50] batch [1220/2000] time 4.395 (3.473) data 0.000 (0.001) loss 2.9780 (1.2675) lr 1.8443e-03 eta 2 days, 20:17:29
epoch [15/50] batch [1240/2000] time 4.373 (3.488) data 0.000 (0.001) loss 0.2395 (1.2664) lr 1.8443e-03 eta 2 days, 20:33:38
epoch [15/50] batch [1260/2000] time 4.349 (3.502) data 0.000 (0.001) loss 0.8829 (1.2655) lr 1.8443e-03 eta 2 days, 20:49:04
epoch [15/50] batch [1280/2000] time 4.411 (3.516) data 0.000 (0.001) loss 0.9594 (1.2687) lr 1.8443e-03 eta 2 days, 21:04:05
epoch [15/50] batch [1300/2000] time 4.386 (3.529) data 0.000 (0.001) loss 0.5119 (1.2644) lr 1.8443e-03 eta 2 days, 21:18:30
epoch [15/50] batch [1320/2000] time 4.383 (3.542) data 0.000 (0.001) loss 0.7281 (1.2675) lr 1.8443e-03 eta 2 days, 21:32:29
epoch [15/50] batch [1340/2000] time 4.397 (3.555) data 0.000 (0.001) loss 0.4019 (1.2676) lr 1.8443e-03 eta 2 days, 21:46:05
epoch [15/50] batch [1360/2000] time 4.327 (3.567) data 0.000 (0.001) loss 2.1193 (1.2691) lr 1.8443e-03 eta 2 days, 21:59:14
epoch [15/50] batch [1380/2000] time 4.429 (3.579) data 0.000 (0.001) loss 1.9451 (1.2662) lr 1.8443e-03 eta 2 days, 22:11:58
epoch [15/50] batch [1400/2000] time 4.375 (3.590) data 0.000 (0.001) loss 1.6025 (1.2680) lr 1.8443e-03 eta 2 days, 22:24:13
epoch [15/50] batch [1420/2000] time 4.416 (3.601) data 0.000 (0.001) loss 0.9784 (1.2633) lr 1.8443e-03 eta 2 days, 22:36:00
epoch [15/50] batch [1440/2000] time 4.405 (3.612) data 0.000 (0.001) loss 1.1768 (1.2620) lr 1.8443e-03 eta 2 days, 22:47:36
epoch [15/50] batch [1460/2000] time 4.486 (3.621) data 0.000 (0.001) loss 0.1855 (1.2587) lr 1.8443e-03 eta 2 days, 22:57:25
epoch [15/50] batch [1480/2000] time 4.475 (3.632) data 0.000 (0.001) loss 1.2142 (1.2564) lr 1.8443e-03 eta 2 days, 23:09:19
epoch [15/50] batch [1500/2000] time 4.373 (3.625) data 0.000 (0.001) loss 4.1143 (1.2552) lr 1.8443e-03 eta 2 days, 22:59:26
epoch [15/50] batch [1520/2000] time 4.391 (3.635) data 0.000 (0.001) loss 2.1505 (1.2579) lr 1.8443e-03 eta 2 days, 23:09:44
epoch [15/50] batch [1540/2000] time 4.388 (3.644) data 0.000 (0.001) loss 0.5617 (1.2577) lr 1.8443e-03 eta 2 days, 23:19:36
epoch [15/50] batch [1560/2000] time 4.379 (3.654) data 0.000 (0.001) loss 0.4375 (1.2614) lr 1.8443e-03 eta 2 days, 23:29:16
epoch [15/50] batch [1580/2000] time 4.389 (3.663) data 0.000 (0.001) loss 1.4307 (1.2641) lr 1.8443e-03 eta 2 days, 23:38:38
epoch [15/50] batch [1600/2000] time 4.309 (3.671) data 0.000 (0.001) loss 0.9713 (1.2617) lr 1.8443e-03 eta 2 days, 23:47:47
epoch [15/50] batch [1620/2000] time 4.424 (3.680) data 0.000 (0.001) loss 0.6140 (1.2608) lr 1.8443e-03 eta 2 days, 23:56:56
epoch [15/50] batch [1640/2000] time 4.364 (3.689) data 0.000 (0.001) loss 2.0275 (1.2605) lr 1.8443e-03 eta 3 days, 0:05:33
epoch [15/50] batch [1660/2000] time 4.415 (3.697) data 0.000 (0.001) loss 0.6918 (1.2601) lr 1.8443e-03 eta 3 days, 0:13:45
epoch [15/50] batch [1680/2000] time 4.383 (3.705) data 0.001 (0.001) loss 0.4843 (1.2604) lr 1.8443e-03 eta 3 days, 0:22:09
epoch [15/50] batch [1700/2000] time 4.372 (3.713) data 0.000 (0.001) loss 0.5212 (1.2584) lr 1.8443e-03 eta 3 days, 0:30:13
epoch [15/50] batch [1720/2000] time 4.401 (3.721) data 0.000 (0.001) loss 0.4115 (1.2612) lr 1.8443e-03 eta 3 days, 0:38:04
epoch [15/50] batch [1740/2000] time 4.371 (3.728) data 0.000 (0.001) loss 2.2279 (1.2608) lr 1.8443e-03 eta 3 days, 0:45:42
epoch [15/50] batch [1760/2000] time 4.403 (3.736) data 0.000 (0.001) loss 0.5233 (1.2606) lr 1.8443e-03 eta 3 days, 0:53:04
epoch [15/50] batch [1780/2000] time 4.377 (3.743) data 0.000 (0.001) loss 1.6485 (1.2572) lr 1.8443e-03 eta 3 days, 1:00:21
epoch [15/50] batch [1800/2000] time 4.328 (3.750) data 0.000 (0.001) loss 1.7803 (1.2563) lr 1.8443e-03 eta 3 days, 1:07:23
epoch [15/50] batch [1820/2000] time 4.348 (3.757) data 0.000 (0.001) loss 3.0059 (1.2541) lr 1.8443e-03 eta 3 days, 1:13:58
epoch [15/50] batch [1840/2000] time 4.377 (3.763) data 0.000 (0.001) loss 2.2150 (1.2530) lr 1.8443e-03 eta 3 days, 1:20:25
epoch [15/50] batch [1860/2000] time 4.323 (3.770) data 0.000 (0.001) loss 0.4143 (1.2497) lr 1.8443e-03 eta 3 days, 1:26:41
epoch [15/50] batch [1880/2000] time 4.419 (3.776) data 0.000 (0.001) loss 0.0202 (1.2487) lr 1.8443e-03 eta 3 days, 1:33:07
epoch [15/50] batch [1900/2000] time 4.323 (3.782) data 0.000 (0.001) loss 0.1683 (1.2457) lr 1.8443e-03 eta 3 days, 1:39:08
epoch [15/50] batch [1920/2000] time 4.371 (3.788) data 0.000 (0.001) loss 0.4900 (1.2471) lr 1.8443e-03 eta 3 days, 1:44:54
epoch [15/50] batch [1940/2000] time 4.359 (3.794) data 0.000 (0.001) loss 2.5055 (1.2474) lr 1.8443e-03 eta 3 days, 1:50:38
epoch [15/50] batch [1960/2000] time 4.384 (3.800) data 0.000 (0.001) loss 2.5643 (1.2473) lr 1.8443e-03 eta 3 days, 1:56:22
epoch [15/50] batch [1980/2000] time 4.381 (3.806) data 0.000 (0.001) loss 0.8046 (1.2442) lr 1.8443e-03 eta 3 days, 2:01:45
epoch [15/50] batch [2000/2000] time 4.337 (3.811) data 0.000 (0.001) loss 1.3786 (1.2441) lr 1.8090e-03 eta 3 days, 2:06:33
epoch [16/50] batch [20/2000] time 4.360 (4.401) data 0.000 (0.030) loss 1.6123 (1.1282) lr 1.8090e-03 eta 3 days, 13:32:43
epoch [16/50] batch [40/2000] time 4.389 (4.383) data 0.000 (0.015) loss 0.5535 (1.1038) lr 1.8090e-03 eta 3 days, 13:10:32
epoch [16/50] batch [60/2000] time 4.381 (4.377) data 0.001 (0.011) loss 0.9865 (1.1107) lr 1.8090e-03 eta 3 days, 13:01:37
epoch [16/50] batch [80/2000] time 4.387 (4.377) data 0.000 (0.008) loss 2.0277 (1.2099) lr 1.8090e-03 eta 3 days, 13:00:09
epoch [16/50] batch [100/2000] time 4.368 (4.375) data 0.000 (0.006) loss 0.6856 (1.1935) lr 1.8090e-03 eta 3 days, 12:57:23
epoch [16/50] batch [120/2000] time 4.391 (4.374) data 0.000 (0.005) loss 1.2586 (1.1349) lr 1.8090e-03 eta 3 days, 12:54:39
epoch [16/50] batch [140/2000] time 4.380 (4.374) data 0.000 (0.005) loss 0.0605 (1.1362) lr 1.8090e-03 eta 3 days, 12:52:39
epoch [16/50] batch [160/2000] time 4.317 (4.372) data 0.000 (0.004) loss 1.7232 (1.1166) lr 1.8090e-03 eta 3 days, 12:49:34
epoch [16/50] batch [180/2000] time 4.365 (4.372) data 0.000 (0.004) loss 4.4206 (1.1469) lr 1.8090e-03 eta 3 days, 12:47:42
epoch [16/50] batch [200/2000] time 4.389 (4.371) data 0.000 (0.003) loss 1.6956 (1.1811) lr 1.8090e-03 eta 3 days, 12:44:47
epoch [16/50] batch [220/2000] time 4.381 (4.370) data 0.000 (0.003) loss 0.7493 (1.1985) lr 1.8090e-03 eta 3 days, 12:42:32
epoch [16/50] batch [240/2000] time 4.322 (4.371) data 0.000 (0.003) loss 0.4298 (1.2078) lr 1.8090e-03 eta 3 days, 12:41:45
epoch [16/50] batch [260/2000] time 4.342 (4.371) data 0.000 (0.003) loss 1.8407 (1.2013) lr 1.8090e-03 eta 3 days, 12:40:26
epoch [16/50] batch [280/2000] time 4.370 (4.371) data 0.000 (0.003) loss 0.6420 (1.1775) lr 1.8090e-03 eta 3 days, 12:39:39
epoch [16/50] batch [300/2000] time 4.357 (4.371) data 0.000 (0.002) loss 1.0685 (1.1770) lr 1.8090e-03 eta 3 days, 12:37:40
epoch [16/50] batch [320/2000] time 4.364 (4.371) data 0.000 (0.002) loss 2.8563 (1.1721) lr 1.8090e-03 eta 3 days, 12:35:57
epoch [16/50] batch [340/2000] time 4.337 (4.371) data 0.000 (0.002) loss 2.3267 (1.1823) lr 1.8090e-03 eta 3 days, 12:34:09
epoch [16/50] batch [360/2000] time 4.370 (4.370) data 0.000 (0.002) loss 0.3088 (1.1899) lr 1.8090e-03 eta 3 days, 12:32:19
epoch [16/50] batch [380/2000] time 4.383 (4.371) data 0.000 (0.002) loss 0.9959 (1.1806) lr 1.8090e-03 eta 3 days, 12:31:18
epoch [16/50] batch [400/2000] time 4.361 (4.370) data 0.000 (0.002) loss 0.5723 (1.2019) lr 1.8090e-03 eta 3 days, 12:29:25
epoch [16/50] batch [420/2000] time 4.356 (4.370) data 0.000 (0.002) loss 0.3370 (1.2053) lr 1.8090e-03 eta 3 days, 12:27:48
epoch [16/50] batch [440/2000] time 4.339 (4.370) data 0.000 (0.002) loss 0.6871 (1.2134) lr 1.8090e-03 eta 3 days, 12:25:59
epoch [16/50] batch [460/2000] time 4.324 (4.369) data 0.000 (0.002) loss 1.4328 (1.2181) lr 1.8090e-03 eta 3 days, 12:24:01
epoch [16/50] batch [480/2000] time 4.457 (4.365) data 0.004 (0.002) loss 1.4717 (1.2151) lr 1.8090e-03 eta 3 days, 12:17:50
epoch [16/50] batch [500/2000] time 4.470 (4.368) data 0.000 (0.002) loss 0.5426 (1.2234) lr 1.8090e-03 eta 3 days, 12:19:46
epoch [16/50] batch [520/2000] time 4.325 (4.321) data 0.000 (0.002) loss 1.6184 (1.2359) lr 1.8090e-03 eta 3 days, 11:24:05
epoch [16/50] batch [540/2000] time 4.353 (4.323) data 0.000 (0.002) loss 0.4610 (1.2207) lr 1.8090e-03 eta 3 days, 11:24:28
epoch [16/50] batch [560/2000] time 4.401 (4.324) data 0.000 (0.001) loss 0.0575 (1.2268) lr 1.8090e-03 eta 3 days, 11:24:39
epoch [16/50] batch [580/2000] time 4.407 (4.326) data 0.000 (0.001) loss 0.8721 (1.2290) lr 1.8090e-03 eta 3 days, 11:25:34
epoch [16/50] batch [600/2000] time 4.422 (4.329) data 0.001 (0.001) loss 0.8649 (1.2126) lr 1.8090e-03 eta 3 days, 11:26:46
epoch [16/50] batch [620/2000] time 4.363 (4.330) data 0.000 (0.001) loss 0.6572 (1.2170) lr 1.8090e-03 eta 3 days, 11:27:24
epoch [16/50] batch [640/2000] time 4.369 (4.333) data 0.000 (0.001) loss 0.0531 (1.2083) lr 1.8090e-03 eta 3 days, 11:28:28
epoch [16/50] batch [660/2000] time 4.416 (4.334) data 0.000 (0.001) loss 2.0252 (1.2052) lr 1.8090e-03 eta 3 days, 11:28:41
epoch [16/50] batch [680/2000] time 4.419 (4.336) data 0.000 (0.001) loss 0.8867 (1.2027) lr 1.8090e-03 eta 3 days, 11:29:07
epoch [16/50] batch [700/2000] time 4.333 (4.337) data 0.000 (0.001) loss 1.3740 (1.2019) lr 1.8090e-03 eta 3 days, 11:29:15
epoch [16/50] batch [720/2000] time 4.362 (4.338) data 0.000 (0.001) loss 0.1483 (1.1983) lr 1.8090e-03 eta 3 days, 11:29:11
epoch [16/50] batch [740/2000] time 4.410 (4.339) data 0.000 (0.001) loss 3.0034 (1.1967) lr 1.8090e-03 eta 3 days, 11:29:06
epoch [16/50] batch [760/2000] time 4.423 (4.341) data 0.001 (0.001) loss 0.6312 (1.2017) lr 1.8090e-03 eta 3 days, 11:29:16
epoch [16/50] batch [780/2000] time 4.378 (4.342) data 0.000 (0.001) loss 0.5399 (1.1986) lr 1.8090e-03 eta 3 days, 11:29:17
epoch [16/50] batch [800/2000] time 4.370 (4.344) data 0.000 (0.001) loss 2.5847 (1.1948) lr 1.8090e-03 eta 3 days, 11:29:34
epoch [16/50] batch [820/2000] time 4.331 (4.344) data 0.000 (0.001) loss 0.3023 (1.2027) lr 1.8090e-03 eta 3 days, 11:28:46
epoch [16/50] batch [840/2000] time 4.395 (4.345) data 0.004 (0.001) loss 2.6043 (1.2033) lr 1.8090e-03 eta 3 days, 11:28:16
epoch [16/50] batch [860/2000] time 4.400 (4.346) data 0.000 (0.001) loss 0.0126 (1.2004) lr 1.8090e-03 eta 3 days, 11:27:46
epoch [16/50] batch [880/2000] time 4.403 (4.347) data 0.000 (0.001) loss 0.1328 (1.2008) lr 1.8090e-03 eta 3 days, 11:27:12
epoch [16/50] batch [900/2000] time 4.366 (4.347) data 0.000 (0.001) loss 1.5897 (1.2014) lr 1.8090e-03 eta 3 days, 11:26:38
epoch [16/50] batch [920/2000] time 4.380 (4.348) data 0.000 (0.001) loss 3.1371 (1.2023) lr 1.8090e-03 eta 3 days, 11:25:46
epoch [16/50] batch [940/2000] time 4.339 (4.349) data 0.000 (0.001) loss 0.2842 (1.1994) lr 1.8090e-03 eta 3 days, 11:25:07
epoch [16/50] batch [960/2000] time 4.336 (4.349) data 0.000 (0.001) loss 0.8588 (1.2056) lr 1.8090e-03 eta 3 days, 11:24:20
epoch [16/50] batch [980/2000] time 4.322 (4.350) data 0.000 (0.001) loss 1.5636 (1.2061) lr 1.8090e-03 eta 3 days, 11:23:31
epoch [16/50] batch [1000/2000] time 4.417 (4.350) data 0.000 (0.001) loss 0.5141 (1.2026) lr 1.8090e-03 eta 3 days, 11:22:51
epoch [16/50] batch [1020/2000] time 4.385 (4.350) data 0.000 (0.001) loss 0.3646 (1.2033) lr 1.8090e-03 eta 3 days, 11:21:05
epoch [16/50] batch [1040/2000] time 4.365 (4.351) data 0.000 (0.001) loss 1.4219 (1.2098) lr 1.8090e-03 eta 3 days, 11:20:24
epoch [16/50] batch [1060/2000] time 4.399 (4.351) data 0.000 (0.001) loss 1.4793 (1.2121) lr 1.8090e-03 eta 3 days, 11:19:46
epoch [16/50] batch [1080/2000] time 4.371 (4.352) data 0.003 (0.001) loss 1.5818 (1.2065) lr 1.8090e-03 eta 3 days, 11:19:01
epoch [16/50] batch [1100/2000] time 4.338 (4.353) data 0.000 (0.001) loss 1.1113 (1.2087) lr 1.8090e-03 eta 3 days, 11:18:08
epoch [16/50] batch [1120/2000] time 4.385 (4.353) data 0.000 (0.001) loss 2.8838 (1.2110) lr 1.8090e-03 eta 3 days, 11:17:18
epoch [16/50] batch [1140/2000] time 4.416 (4.354) data 0.001 (0.001) loss 0.3428 (1.2145) lr 1.8090e-03 eta 3 days, 11:16:28
epoch [16/50] batch [1160/2000] time 4.393 (4.354) data 0.000 (0.001) loss 0.2138 (1.2093) lr 1.8090e-03 eta 3 days, 11:15:38
epoch [16/50] batch [1180/2000] time 4.385 (4.355) data 0.001 (0.001) loss 0.7865 (1.2136) lr 1.8090e-03 eta 3 days, 11:14:45
epoch [16/50] batch [1200/2000] time 4.406 (4.355) data 0.000 (0.001) loss 0.4950 (1.2120) lr 1.8090e-03 eta 3 days, 11:13:45
epoch [16/50] batch [1220/2000] time 4.407 (4.355) data 0.000 (0.001) loss 0.5303 (1.2162) lr 1.8090e-03 eta 3 days, 11:12:42
epoch [16/50] batch [1240/2000] time 4.394 (4.356) data 0.000 (0.001) loss 0.6304 (1.2121) lr 1.8090e-03 eta 3 days, 11:11:48
epoch [16/50] batch [1260/2000] time 4.384 (4.356) data 0.000 (0.001) loss 0.2962 (1.2078) lr 1.8090e-03 eta 3 days, 11:10:44
epoch [16/50] batch [1280/2000] time 4.305 (4.356) data 0.000 (0.001) loss 1.6818 (1.2046) lr 1.8090e-03 eta 3 days, 11:09:37
epoch [16/50] batch [1300/2000] time 4.388 (4.357) data 0.000 (0.001) loss 0.1991 (1.2061) lr 1.8090e-03 eta 3 days, 11:08:35
epoch [16/50] batch [1320/2000] time 4.321 (4.357) data 0.000 (0.001) loss 2.8596 (1.2125) lr 1.8090e-03 eta 3 days, 11:07:21
epoch [16/50] batch [1340/2000] time 4.362 (4.357) data 0.000 (0.001) loss 3.3709 (1.2118) lr 1.8090e-03 eta 3 days, 11:06:15
epoch [16/50] batch [1360/2000] time 4.402 (4.358) data 0.000 (0.001) loss 0.1002 (1.2126) lr 1.8090e-03 eta 3 days, 11:05:17
epoch [16/50] batch [1380/2000] time 4.361 (4.358) data 0.000 (0.001) loss 1.1829 (1.2086) lr 1.8090e-03 eta 3 days, 11:04:00
epoch [16/50] batch [1400/2000] time 4.426 (4.358) data 0.015 (0.001) loss 1.0960 (1.2125) lr 1.8090e-03 eta 3 days, 11:02:53
epoch [16/50] batch [1420/2000] time 4.394 (4.359) data 0.000 (0.001) loss 0.0460 (1.2103) lr 1.8090e-03 eta 3 days, 11:01:59
epoch [16/50] batch [1440/2000] time 4.367 (4.359) data 0.000 (0.001) loss 0.9515 (1.2118) lr 1.8090e-03 eta 3 days, 11:00:40
epoch [16/50] batch [1460/2000] time 4.394 (4.359) data 0.000 (0.001) loss 2.8526 (1.2167) lr 1.8090e-03 eta 3 days, 10:59:28
epoch [16/50] batch [1480/2000] time 4.411 (4.359) data 0.000 (0.001) loss 0.7334 (1.2144) lr 1.8090e-03 eta 3 days, 10:58:16
epoch [16/50] batch [1500/2000] time 4.439 (4.358) data 0.000 (0.001) loss 2.1359 (1.2171) lr 1.8090e-03 eta 3 days, 10:55:32
epoch [16/50] batch [1520/2000] time 4.470 (4.359) data 0.000 (0.001) loss 0.4859 (1.2104) lr 1.8090e-03 eta 3 days, 10:55:20
epoch [16/50] batch [1540/2000] time 2.060 (4.342) data 0.001 (0.001) loss 1.5426 (1.2073) lr 1.8090e-03 eta 3 days, 10:34:07
epoch [16/50] batch [1560/2000] time 2.061 (4.312) data 0.000 (0.001) loss 2.2893 (1.2028) lr 1.8090e-03 eta 3 days, 9:59:00
epoch [16/50] batch [1580/2000] time 2.005 (4.284) data 0.000 (0.001) loss 0.1534 (1.1988) lr 1.8090e-03 eta 3 days, 9:24:40
epoch [16/50] batch [1600/2000] time 2.057 (4.255) data 0.000 (0.001) loss 1.9849 (1.1968) lr 1.8090e-03 eta 3 days, 8:51:13
epoch [16/50] batch [1620/2000] time 1.986 (4.228) data 0.000 (0.001) loss 0.9714 (1.1986) lr 1.8090e-03 eta 3 days, 8:18:34
epoch [16/50] batch [1640/2000] time 2.056 (4.201) data 0.000 (0.001) loss 1.7669 (1.2012) lr 1.8090e-03 eta 3 days, 7:46:46
epoch [16/50] batch [1660/2000] time 2.010 (4.175) data 0.000 (0.001) loss 0.6042 (1.1996) lr 1.8090e-03 eta 3 days, 7:15:40
epoch [16/50] batch [1680/2000] time 2.057 (4.150) data 0.001 (0.001) loss 1.4486 (1.2011) lr 1.8090e-03 eta 3 days, 6:45:14
epoch [16/50] batch [1700/2000] time 1.984 (4.125) data 0.000 (0.001) loss 1.4119 (1.2021) lr 1.8090e-03 eta 3 days, 6:15:37
epoch [16/50] batch [1720/2000] time 2.004 (4.101) data 0.000 (0.001) loss 0.6161 (1.2050) lr 1.8090e-03 eta 3 days, 5:46:42
epoch [16/50] batch [1740/2000] time 2.063 (4.077) data 0.000 (0.001) loss 1.7373 (1.2088) lr 1.8090e-03 eta 3 days, 5:18:24
epoch [16/50] batch [1760/2000] time 2.012 (4.054) data 0.000 (0.001) loss 1.1010 (1.2104) lr 1.8090e-03 eta 3 days, 4:50:42
epoch [16/50] batch [1780/2000] time 2.068 (4.031) data 0.000 (0.001) loss 1.0283 (1.2094) lr 1.8090e-03 eta 3 days, 4:23:48
epoch [16/50] batch [1800/2000] time 2.041 (4.009) data 0.001 (0.001) loss 0.9791 (1.2079) lr 1.8090e-03 eta 3 days, 3:57:19
epoch [16/50] batch [1820/2000] time 2.014 (3.988) data 0.000 (0.001) loss 0.8712 (1.2070) lr 1.8090e-03 eta 3 days, 3:31:23
epoch [16/50] batch [1840/2000] time 2.074 (3.967) data 0.000 (0.001) loss 0.0123 (1.2065) lr 1.8090e-03 eta 3 days, 3:06:07
epoch [16/50] batch [1860/2000] time 2.012 (3.946) data 0.000 (0.001) loss 0.8856 (1.2058) lr 1.8090e-03 eta 3 days, 2:41:25
epoch [16/50] batch [1880/2000] time 2.066 (3.926) data 0.000 (0.001) loss 1.0413 (1.2036) lr 1.8090e-03 eta 3 days, 2:17:09
epoch [16/50] batch [1900/2000] time 2.064 (3.906) data 0.000 (0.001) loss 1.2449 (1.2026) lr 1.8090e-03 eta 3 days, 1:53:24
epoch [16/50] batch [1920/2000] time 2.058 (3.887) data 0.000 (0.001) loss 1.6284 (1.2021) lr 1.8090e-03 eta 3 days, 1:29:59
epoch [16/50] batch [1940/2000] time 2.062 (3.868) data 0.000 (0.001) loss 1.7076 (1.2043) lr 1.8090e-03 eta 3 days, 1:07:04
epoch [16/50] batch [1960/2000] time 2.005 (3.849) data 0.000 (0.001) loss 0.7309 (1.2050) lr 1.8090e-03 eta 3 days, 0:44:35
epoch [16/50] batch [1980/2000] time 2.009 (3.830) data 0.000 (0.001) loss 1.5471 (1.2099) lr 1.8090e-03 eta 3 days, 0:22:29
epoch [16/50] batch [2000/2000] time 2.052 (3.813) data 0.000 (0.001) loss 0.3767 (1.2080) lr 1.7705e-03 eta 3 days, 0:00:50
epoch [17/50] batch [20/2000] time 2.037 (2.075) data 0.000 (0.030) loss 2.1028 (1.3321) lr 1.7705e-03 eta 1 day, 15:11:06
epoch [17/50] batch [40/2000] time 2.004 (2.058) data 0.000 (0.015) loss 0.8656 (1.1753) lr 1.7705e-03 eta 1 day, 14:51:22
epoch [17/50] batch [60/2000] time 2.077 (2.053) data 0.001 (0.010) loss 0.6734 (1.1793) lr 1.7705e-03 eta 1 day, 14:44:45
epoch [17/50] batch [80/2000] time 2.007 (2.048) data 0.000 (0.008) loss 2.3335 (1.2285) lr 1.7705e-03 eta 1 day, 14:38:38
epoch [17/50] batch [100/2000] time 2.056 (2.045) data 0.000 (0.006) loss 1.6329 (1.1766) lr 1.7705e-03 eta 1 day, 14:34:01
epoch [17/50] batch [120/2000] time 2.004 (2.045) data 0.000 (0.005) loss 3.0567 (1.2170) lr 1.7705e-03 eta 1 day, 14:33:24
epoch [17/50] batch [140/2000] time 2.056 (2.044) data 0.000 (0.005) loss 0.5675 (1.1908) lr 1.7705e-03 eta 1 day, 14:32:03
epoch [17/50] batch [160/2000] time 2.059 (2.044) data 0.000 (0.004) loss 1.2584 (1.2028) lr 1.7705e-03 eta 1 day, 14:31:27
epoch [17/50] batch [180/2000] time 2.066 (2.043) data 0.000 (0.004) loss 2.4718 (1.2076) lr 1.7705e-03 eta 1 day, 14:29:17
epoch [17/50] batch [200/2000] time 2.058 (2.043) data 0.000 (0.003) loss 1.7634 (1.2181) lr 1.7705e-03 eta 1 day, 14:28:09
epoch [17/50] batch [220/2000] time 2.004 (2.042) data 0.000 (0.003) loss 1.3069 (1.2148) lr 1.7705e-03 eta 1 day, 14:27:15
epoch [17/50] batch [240/2000] time 2.008 (2.041) data 0.000 (0.003) loss 0.3276 (1.2346) lr 1.7705e-03 eta 1 day, 14:25:25
epoch [17/50] batch [260/2000] time 2.041 (2.042) data 0.000 (0.003) loss 1.3416 (1.2126) lr 1.7705e-03 eta 1 day, 14:24:51
epoch [17/50] batch [280/2000] time 2.031 (2.041) data 0.000 (0.002) loss 1.1644 (1.2147) lr 1.7705e-03 eta 1 day, 14:23:49
epoch [17/50] batch [300/2000] time 1.976 (2.040) data 0.000 (0.002) loss 0.8828 (1.2187) lr 1.7705e-03 eta 1 day, 14:22:21
epoch [17/50] batch [320/2000] time 2.054 (2.040) data 0.000 (0.002) loss 0.2470 (1.2185) lr 1.7705e-03 eta 1 day, 14:21:06
epoch [17/50] batch [340/2000] time 2.033 (2.040) data 0.000 (0.002) loss 0.4904 (1.2080) lr 1.7705e-03 eta 1 day, 14:20:01
epoch [17/50] batch [360/2000] time 2.032 (2.039) data 0.000 (0.002) loss 0.4401 (1.2055) lr 1.7705e-03 eta 1 day, 14:19:07
epoch [17/50] batch [380/2000] time 2.056 (2.039) data 0.000 (0.002) loss 1.6145 (1.2086) lr 1.7705e-03 eta 1 day, 14:18:10
epoch [17/50] batch [400/2000] time 1.984 (2.039) data 0.000 (0.002) loss 1.1334 (1.2197) lr 1.7705e-03 eta 1 day, 14:17:08
epoch [17/50] batch [420/2000] time 2.034 (2.039) data 0.000 (0.002) loss 0.6210 (1.1966) lr 1.7705e-03 eta 1 day, 14:16:16
epoch [17/50] batch [440/2000] time 2.000 (2.038) data 0.000 (0.002) loss 0.5122 (1.1969) lr 1.7705e-03 eta 1 day, 14:14:57
epoch [17/50] batch [460/2000] time 2.004 (2.038) data 0.000 (0.002) loss 0.1662 (1.1920) lr 1.7705e-03 eta 1 day, 14:14:31
epoch [17/50] batch [480/2000] time 2.035 (2.039) data 0.000 (0.002) loss 2.2206 (1.2018) lr 1.7705e-03 eta 1 day, 14:14:00
epoch [17/50] batch [500/2000] time 2.061 (2.039) data 0.000 (0.001) loss 2.3079 (1.2080) lr 1.7705e-03 eta 1 day, 14:13:24
epoch [17/50] batch [520/2000] time 2.062 (2.039) data 0.000 (0.001) loss 0.4972 (1.2097) lr 1.7705e-03 eta 1 day, 14:12:49
epoch [17/50] batch [540/2000] time 2.066 (2.039) data 0.000 (0.001) loss 0.1140 (1.2116) lr 1.7705e-03 eta 1 day, 14:12:21
epoch [17/50] batch [560/2000] time 2.009 (2.039) data 0.000 (0.001) loss 0.5034 (1.2099) lr 1.7705e-03 eta 1 day, 14:11:34
epoch [17/50] batch [580/2000] time 2.059 (2.039) data 0.001 (0.001) loss 0.1750 (1.2027) lr 1.7705e-03 eta 1 day, 14:10:36
epoch [17/50] batch [600/2000] time 2.042 (2.039) data 0.001 (0.001) loss 1.0099 (1.1939) lr 1.7705e-03 eta 1 day, 14:10:11
epoch [17/50] batch [620/2000] time 2.015 (2.039) data 0.000 (0.001) loss 1.9073 (1.1897) lr 1.7705e-03 eta 1 day, 14:09:44
epoch [17/50] batch [640/2000] time 2.016 (2.039) data 0.000 (0.001) loss 1.3664 (1.1887) lr 1.7705e-03 eta 1 day, 14:09:08
epoch [17/50] batch [660/2000] time 2.006 (2.039) data 0.000 (0.001) loss 0.2922 (1.1960) lr 1.7705e-03 eta 1 day, 14:08:26
epoch [17/50] batch [680/2000] time 2.082 (2.039) data 0.000 (0.001) loss 0.4831 (1.1912) lr 1.7705e-03 eta 1 day, 14:07:51
epoch [17/50] batch [700/2000] time 2.012 (2.039) data 0.000 (0.001) loss 1.9677 (1.2038) lr 1.7705e-03 eta 1 day, 14:07:33
epoch [17/50] batch [720/2000] time 2.039 (2.040) data 0.000 (0.001) loss 0.7576 (1.1963) lr 1.7705e-03 eta 1 day, 14:06:59
epoch [17/50] batch [740/2000] time 2.060 (2.040) data 0.000 (0.001) loss 0.3809 (1.1837) lr 1.7705e-03 eta 1 day, 14:06:20
epoch [17/50] batch [760/2000] time 2.070 (2.040) data 0.000 (0.001) loss 0.8202 (1.1798) lr 1.7705e-03 eta 1 day, 14:05:41
epoch [17/50] batch [780/2000] time 2.058 (2.040) data 0.000 (0.001) loss 0.3169 (1.1801) lr 1.7705e-03 eta 1 day, 14:05:11
epoch [17/50] batch [800/2000] time 2.063 (2.040) data 0.000 (0.001) loss 2.0397 (1.1759) lr 1.7705e-03 eta 1 day, 14:04:29
epoch [17/50] batch [820/2000] time 2.007 (2.040) data 0.000 (0.001) loss 0.4840 (1.1733) lr 1.7705e-03 eta 1 day, 14:03:42
epoch [17/50] batch [840/2000] time 2.040 (2.040) data 0.000 (0.001) loss 2.5659 (1.1715) lr 1.7705e-03 eta 1 day, 14:02:56
epoch [17/50] batch [860/2000] time 2.006 (2.040) data 0.000 (0.001) loss 0.7165 (1.1776) lr 1.7705e-03 eta 1 day, 14:02:14
epoch [17/50] batch [880/2000] time 2.061 (2.039) data 0.000 (0.001) loss 0.2084 (1.1773) lr 1.7705e-03 eta 1 day, 14:01:24
epoch [17/50] batch [900/2000] time 2.012 (2.039) data 0.000 (0.001) loss 0.6969 (1.1730) lr 1.7705e-03 eta 1 day, 14:00:36
epoch [17/50] batch [920/2000] time 2.061 (2.039) data 0.000 (0.001) loss 1.5046 (1.1732) lr 1.7705e-03 eta 1 day, 13:59:55
epoch [17/50] batch [940/2000] time 2.037 (2.039) data 0.000 (0.001) loss 1.6595 (1.1789) lr 1.7705e-03 eta 1 day, 13:59:21
epoch [17/50] batch [960/2000] time 2.009 (2.039) data 0.000 (0.001) loss 1.6199 (1.1751) lr 1.7705e-03 eta 1 day, 13:58:43
epoch [17/50] batch [980/2000] time 2.062 (2.040) data 0.000 (0.001) loss 1.4223 (1.1814) lr 1.7705e-03 eta 1 day, 13:58:07
epoch [17/50] batch [1000/2000] time 2.044 (2.039) data 0.000 (0.001) loss 1.0179 (1.1801) lr 1.7705e-03 eta 1 day, 13:57:20
epoch [17/50] batch [1020/2000] time 2.075 (2.039) data 0.000 (0.001) loss 1.0279 (1.1777) lr 1.7705e-03 eta 1 day, 13:56:31
epoch [17/50] batch [1040/2000] time 2.013 (2.039) data 0.000 (0.001) loss 0.2134 (1.1801) lr 1.7705e-03 eta 1 day, 13:55:53
epoch [17/50] batch [1060/2000] time 2.057 (2.039) data 0.000 (0.001) loss 0.3589 (1.1782) lr 1.7705e-03 eta 1 day, 13:55:12
epoch [17/50] batch [1080/2000] time 2.038 (2.039) data 0.000 (0.001) loss 1.0505 (1.1771) lr 1.7705e-03 eta 1 day, 13:54:30
epoch [17/50] batch [1100/2000] time 2.079 (2.039) data 0.000 (0.001) loss 0.3953 (1.1694) lr 1.7705e-03 eta 1 day, 13:53:58
epoch [17/50] batch [1120/2000] time 2.041 (2.039) data 0.000 (0.001) loss 1.2169 (1.1720) lr 1.7705e-03 eta 1 day, 13:53:13
epoch [17/50] batch [1140/2000] time 2.039 (2.039) data 0.001 (0.001) loss 1.0607 (1.1729) lr 1.7705e-03 eta 1 day, 13:52:35
epoch [17/50] batch [1160/2000] time 2.007 (2.039) data 0.000 (0.001) loss 0.3703 (1.1738) lr 1.7705e-03 eta 1 day, 13:51:55
epoch [17/50] batch [1180/2000] time 1.989 (2.039) data 0.000 (0.001) loss 3.4461 (1.1766) lr 1.7705e-03 eta 1 day, 13:51:11
epoch [17/50] batch [1200/2000] time 2.007 (2.040) data 0.000 (0.001) loss 2.3183 (1.1764) lr 1.7705e-03 eta 1 day, 13:50:42
epoch [17/50] batch [1220/2000] time 2.032 (2.040) data 0.000 (0.001) loss 2.5491 (1.1744) lr 1.7705e-03 eta 1 day, 13:49:59
epoch [17/50] batch [1240/2000] time 2.060 (2.039) data 0.000 (0.001) loss 0.9054 (1.1770) lr 1.7705e-03 eta 1 day, 13:49:13
epoch [17/50] batch [1260/2000] time 2.057 (2.039) data 0.000 (0.001) loss 0.8674 (1.1823) lr 1.7705e-03 eta 1 day, 13:48:27
epoch [17/50] batch [1280/2000] time 2.035 (2.039) data 0.000 (0.001) loss 1.4849 (1.1865) lr 1.7705e-03 eta 1 day, 13:47:44
epoch [17/50] batch [1300/2000] time 2.005 (2.039) data 0.000 (0.001) loss 1.4216 (1.1875) lr 1.7705e-03 eta 1 day, 13:46:55
epoch [17/50] batch [1320/2000] time 2.058 (2.039) data 0.000 (0.001) loss 0.4769 (1.1879) lr 1.7705e-03 eta 1 day, 13:46:13
epoch [17/50] batch [1340/2000] time 2.058 (2.039) data 0.000 (0.001) loss 0.2315 (1.1905) lr 1.7705e-03 eta 1 day, 13:45:36
epoch [17/50] batch [1360/2000] time 2.061 (2.039) data 0.000 (0.001) loss 0.1366 (1.1939) lr 1.7705e-03 eta 1 day, 13:44:44
epoch [17/50] batch [1380/2000] time 2.034 (2.039) data 0.000 (0.001) loss 0.4156 (1.1937) lr 1.7705e-03 eta 1 day, 13:43:57
epoch [17/50] batch [1400/2000] time 2.057 (2.039) data 0.000 (0.001) loss 1.0817 (1.1910) lr 1.7705e-03 eta 1 day, 13:43:15
epoch [17/50] batch [1420/2000] time 2.034 (2.039) data 0.000 (0.001) loss 0.4063 (1.1881) lr 1.7705e-03 eta 1 day, 13:42:30
epoch [17/50] batch [1440/2000] time 2.003 (2.039) data 0.000 (0.001) loss 1.2017 (1.1828) lr 1.7705e-03 eta 1 day, 13:41:52
epoch [17/50] batch [1460/2000] time 2.034 (2.039) data 0.000 (0.001) loss 0.4774 (1.1859) lr 1.7705e-03 eta 1 day, 13:41:17
epoch [17/50] batch [1480/2000] time 2.008 (2.039) data 0.000 (0.001) loss 1.3207 (1.1894) lr 1.7705e-03 eta 1 day, 13:40:35
epoch [17/50] batch [1500/2000] time 2.035 (2.039) data 0.000 (0.001) loss 1.4395 (1.1865) lr 1.7705e-03 eta 1 day, 13:39:54
epoch [17/50] batch [1520/2000] time 2.040 (2.039) data 0.000 (0.001) loss 2.0816 (1.1843) lr 1.7705e-03 eta 1 day, 13:39:17
epoch [17/50] batch [1540/2000] time 2.068 (2.039) data 0.000 (0.001) loss 0.1488 (1.1825) lr 1.7705e-03 eta 1 day, 13:38:41
epoch [17/50] batch [1560/2000] time 2.012 (2.039) data 0.000 (0.001) loss 2.9893 (1.1854) lr 1.7705e-03 eta 1 day, 13:37:58
epoch [17/50] batch [1580/2000] time 2.068 (2.039) data 0.000 (0.001) loss 1.6070 (1.1875) lr 1.7705e-03 eta 1 day, 13:37:25
epoch [17/50] batch [1600/2000] time 2.064 (2.039) data 0.000 (0.001) loss 0.2963 (1.1871) lr 1.7705e-03 eta 1 day, 13:36:44
epoch [17/50] batch [1620/2000] time 2.071 (2.039) data 0.000 (0.001) loss 0.1782 (1.1843) lr 1.7705e-03 eta 1 day, 13:36:09
epoch [17/50] batch [1640/2000] time 2.079 (2.039) data 0.000 (0.001) loss 1.0463 (1.1853) lr 1.7705e-03 eta 1 day, 13:35:38
epoch [17/50] batch [1660/2000] time 2.064 (2.039) data 0.000 (0.001) loss 2.0095 (1.1862) lr 1.7705e-03 eta 1 day, 13:34:58
epoch [17/50] batch [1680/2000] time 2.062 (2.039) data 0.000 (0.001) loss 1.7507 (1.1877) lr 1.7705e-03 eta 1 day, 13:34:13
epoch [17/50] batch [1700/2000] time 2.060 (2.039) data 0.000 (0.001) loss 0.0844 (1.1852) lr 1.7705e-03 eta 1 day, 13:33:35
epoch [17/50] batch [1720/2000] time 2.037 (2.039) data 0.000 (0.001) loss 0.6241 (1.1886) lr 1.7705e-03 eta 1 day, 13:32:51
epoch [17/50] batch [1740/2000] time 2.009 (2.039) data 0.000 (0.001) loss 2.2541 (1.1904) lr 1.7705e-03 eta 1 day, 13:32:04
epoch [17/50] batch [1760/2000] time 1.979 (2.039) data 0.000 (0.001) loss 1.1333 (1.1896) lr 1.7705e-03 eta 1 day, 13:31:21
epoch [17/50] batch [1780/2000] time 2.009 (2.039) data 0.000 (0.001) loss 1.6553 (1.1918) lr 1.7705e-03 eta 1 day, 13:30:41
epoch [17/50] batch [1800/2000] time 2.037 (2.039) data 0.000 (0.001) loss 0.5106 (1.1932) lr 1.7705e-03 eta 1 day, 13:29:59
epoch [17/50] batch [1820/2000] time 2.065 (2.039) data 0.000 (0.001) loss 0.3788 (1.1961) lr 1.7705e-03 eta 1 day, 13:29:17
epoch [17/50] batch [1840/2000] time 2.033 (2.039) data 0.000 (0.001) loss 0.6922 (1.2003) lr 1.7705e-03 eta 1 day, 13:28:33
epoch [17/50] batch [1860/2000] time 2.059 (2.039) data 0.000 (0.001) loss 0.4791 (1.2026) lr 1.7705e-03 eta 1 day, 13:27:51
epoch [17/50] batch [1880/2000] time 2.061 (2.039) data 0.000 (0.001) loss 0.8539 (1.1988) lr 1.7705e-03 eta 1 day, 13:27:09
epoch [17/50] batch [1900/2000] time 2.059 (2.039) data 0.004 (0.001) loss 0.9835 (1.1992) lr 1.7705e-03 eta 1 day, 13:26:32
epoch [17/50] batch [1920/2000] time 2.017 (2.039) data 0.000 (0.001) loss 0.5306 (1.2016) lr 1.7705e-03 eta 1 day, 13:25:55
epoch [17/50] batch [1940/2000] time 2.041 (2.039) data 0.000 (0.001) loss 1.8359 (1.2032) lr 1.7705e-03 eta 1 day, 13:25:23
epoch [17/50] batch [1960/2000] time 2.061 (2.040) data 0.000 (0.001) loss 0.1226 (1.2032) lr 1.7705e-03 eta 1 day, 13:24:49
epoch [17/50] batch [1980/2000] time 2.058 (2.039) data 0.000 (0.001) loss 2.0731 (1.2041) lr 1.7705e-03 eta 1 day, 13:24:07
epoch [17/50] batch [2000/2000] time 2.002 (2.039) data 0.000 (0.001) loss 2.4321 (1.2055) lr 1.7290e-03 eta 1 day, 13:23:18
epoch [18/50] batch [20/2000] time 2.057 (2.064) data 0.000 (0.030) loss 3.6520 (1.2729) lr 1.7290e-03 eta 1 day, 13:49:16
epoch [18/50] batch [40/2000] time 2.070 (2.051) data 0.000 (0.015) loss 1.5795 (1.2370) lr 1.7290e-03 eta 1 day, 13:35:12
epoch [18/50] batch [60/2000] time 2.042 (2.045) data 0.001 (0.010) loss 0.1194 (1.0573) lr 1.7290e-03 eta 1 day, 13:27:45
epoch [18/50] batch [80/2000] time 2.041 (2.045) data 0.000 (0.008) loss 1.7106 (1.0409) lr 1.7290e-03 eta 1 day, 13:27:04
epoch [18/50] batch [100/2000] time 2.016 (2.046) data 0.000 (0.006) loss 2.4383 (1.0813) lr 1.7290e-03 eta 1 day, 13:27:11
epoch [18/50] batch [120/2000] time 2.063 (2.046) data 0.000 (0.005) loss 1.6067 (1.0427) lr 1.7290e-03 eta 1 day, 13:26:05
epoch [18/50] batch [140/2000] time 2.012 (2.045) data 0.000 (0.004) loss 0.9217 (1.0604) lr 1.7290e-03 eta 1 day, 13:24:31
epoch [18/50] batch [160/2000] time 2.011 (2.045) data 0.000 (0.004) loss 1.6859 (1.1376) lr 1.7290e-03 eta 1 day, 13:23:52
epoch [18/50] batch [180/2000] time 2.042 (2.044) data 0.000 (0.004) loss 1.8430 (1.1511) lr 1.7290e-03 eta 1 day, 13:22:37
epoch [18/50] batch [200/2000] time 2.063 (2.044) data 0.000 (0.003) loss 0.4594 (1.1657) lr 1.7290e-03 eta 1 day, 13:21:04
epoch [18/50] batch [220/2000] time 2.014 (2.044) data 0.000 (0.003) loss 2.2499 (1.1667) lr 1.7290e-03 eta 1 day, 13:20:33
epoch [18/50] batch [240/2000] time 2.067 (2.044) data 0.000 (0.003) loss 2.1089 (1.1543) lr 1.7290e-03 eta 1 day, 13:19:58
epoch [18/50] batch [260/2000] time 2.042 (2.044) data 0.000 (0.003) loss 2.6114 (1.1419) lr 1.7290e-03 eta 1 day, 13:19:45
epoch [18/50] batch [280/2000] time 2.015 (2.044) data 0.000 (0.002) loss 2.2124 (1.1437) lr 1.7290e-03 eta 1 day, 13:19:04
epoch [18/50] batch [300/2000] time 2.063 (2.044) data 0.000 (0.002) loss 0.6656 (1.1661) lr 1.7290e-03 eta 1 day, 13:18:35
epoch [18/50] batch [320/2000] time 2.037 (2.045) data 0.000 (0.002) loss 1.8388 (1.1623) lr 1.7290e-03 eta 1 day, 13:18:16
epoch [18/50] batch [340/2000] time 2.059 (2.044) data 0.000 (0.002) loss 0.7822 (1.1442) lr 1.7290e-03 eta 1 day, 13:17:16
epoch [18/50] batch [360/2000] time 2.017 (2.044) data 0.000 (0.002) loss 2.0184 (1.1455) lr 1.7290e-03 eta 1 day, 13:16:17
epoch [18/50] batch [380/2000] time 2.043 (2.044) data 0.000 (0.002) loss 2.2274 (1.1570) lr 1.7290e-03 eta 1 day, 13:15:11
epoch [18/50] batch [400/2000] time 2.064 (2.043) data 0.000 (0.002) loss 1.0865 (1.1561) lr 1.7290e-03 eta 1 day, 13:14:10
epoch [18/50] batch [420/2000] time 2.011 (2.043) data 0.000 (0.002) loss 0.7149 (1.1642) lr 1.7290e-03 eta 1 day, 13:13:31
epoch [18/50] batch [440/2000] time 2.063 (2.043) data 0.000 (0.002) loss 3.0447 (1.1618) lr 1.7290e-03 eta 1 day, 13:12:49
epoch [18/50] batch [460/2000] time 2.070 (2.043) data 0.000 (0.002) loss 0.0822 (1.1689) lr 1.7290e-03 eta 1 day, 13:11:59
epoch [18/50] batch [480/2000] time 2.059 (2.043) data 0.000 (0.001) loss 0.2838 (1.1708) lr 1.7290e-03 eta 1 day, 13:11:29
epoch [18/50] batch [500/2000] time 2.051 (2.043) data 0.000 (0.001) loss 0.2488 (1.1676) lr 1.7290e-03 eta 1 day, 13:10:09
epoch [18/50] batch [520/2000] time 2.055 (2.042) data 0.000 (0.001) loss 0.5463 (1.1649) lr 1.7290e-03 eta 1 day, 13:08:49
epoch [18/50] batch [540/2000] time 2.057 (2.042) data 0.000 (0.001) loss 1.1797 (1.1657) lr 1.7290e-03 eta 1 day, 13:07:46
epoch [18/50] batch [560/2000] time 2.055 (2.042) data 0.000 (0.001) loss 0.1527 (1.1759) lr 1.7290e-03 eta 1 day, 13:06:52
epoch [18/50] batch [580/2000] time 2.039 (2.042) data 0.000 (0.001) loss 1.0887 (1.1862) lr 1.7290e-03 eta 1 day, 13:06:05
epoch [18/50] batch [600/2000] time 2.056 (2.042) data 0.001 (0.001) loss 0.5286 (1.1818) lr 1.7290e-03 eta 1 day, 13:05:16
epoch [18/50] batch [620/2000] time 2.056 (2.041) data 0.000 (0.001) loss 0.1209 (1.1801) lr 1.7290e-03 eta 1 day, 13:04:22
epoch [18/50] batch [640/2000] time 2.056 (2.042) data 0.000 (0.001) loss 1.9539 (1.1826) lr 1.7290e-03 eta 1 day, 13:03:54
epoch [18/50] batch [660/2000] time 2.001 (2.041) data 0.000 (0.001) loss 0.5662 (1.1761) lr 1.7290e-03 eta 1 day, 13:03:03
epoch [18/50] batch [680/2000] time 2.057 (2.041) data 0.000 (0.001) loss 1.8982 (1.1836) lr 1.7290e-03 eta 1 day, 13:02:10
epoch [18/50] batch [700/2000] time 2.057 (2.041) data 0.000 (0.001) loss 2.3399 (1.1814) lr 1.7290e-03 eta 1 day, 13:01:09
epoch [18/50] batch [720/2000] time 2.032 (2.041) data 0.000 (0.001) loss 4.1557 (1.1755) lr 1.7290e-03 eta 1 day, 13:00:37
epoch [18/50] batch [740/2000] time 1.997 (2.041) data 0.000 (0.001) loss 1.0557 (1.1713) lr 1.7290e-03 eta 1 day, 12:59:42
epoch [18/50] batch [760/2000] time 2.064 (2.041) data 0.000 (0.001) loss 1.0242 (1.1755) lr 1.7290e-03 eta 1 day, 12:58:47
epoch [18/50] batch [780/2000] time 2.040 (2.040) data 0.000 (0.001) loss 0.9116 (1.1678) lr 1.7290e-03 eta 1 day, 12:57:54
epoch [18/50] batch [800/2000] time 2.010 (2.041) data 0.000 (0.001) loss 1.9871 (1.1615) lr 1.7290e-03 eta 1 day, 12:57:29
epoch [18/50] batch [820/2000] time 2.037 (2.041) data 0.000 (0.001) loss 1.4189 (1.1641) lr 1.7290e-03 eta 1 day, 12:56:52
epoch [18/50] batch [840/2000] time 2.057 (2.041) data 0.000 (0.001) loss 0.2176 (1.1639) lr 1.7290e-03 eta 1 day, 12:56:03
epoch [18/50] batch [860/2000] time 2.059 (2.040) data 0.000 (0.001) loss 0.3144 (1.1629) lr 1.7290e-03 eta 1 day, 12:55:15
epoch [18/50] batch [880/2000] time 2.059 (2.040) data 0.000 (0.001) loss 2.6014 (1.1624) lr 1.7290e-03 eta 1 day, 12:54:25
epoch [18/50] batch [900/2000] time 2.057 (2.040) data 0.000 (0.001) loss 1.4678 (1.1639) lr 1.7290e-03 eta 1 day, 12:53:29
epoch [18/50] batch [920/2000] time 2.040 (2.040) data 0.000 (0.001) loss 1.6568 (1.1707) lr 1.7290e-03 eta 1 day, 12:52:40
epoch [18/50] batch [940/2000] time 2.046 (2.040) data 0.000 (0.001) loss 0.4511 (1.1727) lr 1.7290e-03 eta 1 day, 12:52:12
epoch [18/50] batch [960/2000] time 2.041 (2.040) data 0.000 (0.001) loss 0.2238 (1.1708) lr 1.7290e-03 eta 1 day, 12:51:28
epoch [18/50] batch [980/2000] time 2.011 (2.040) data 0.000 (0.001) loss 1.4176 (1.1701) lr 1.7290e-03 eta 1 day, 12:50:49
epoch [18/50] batch [1000/2000] time 2.014 (2.040) data 0.000 (0.001) loss 2.9998 (1.1746) lr 1.7290e-03 eta 1 day, 12:50:16
epoch [18/50] batch [1020/2000] time 1.988 (2.040) data 0.000 (0.001) loss 3.8930 (1.1837) lr 1.7290e-03 eta 1 day, 12:49:30
epoch [18/50] batch [1040/2000] time 2.036 (2.040) data 0.000 (0.001) loss 0.2684 (1.1901) lr 1.7290e-03 eta 1 day, 12:48:46
epoch [18/50] batch [1060/2000] time 2.033 (2.040) data 0.000 (0.001) loss 1.4839 (1.1908) lr 1.7290e-03 eta 1 day, 12:48:03
epoch [18/50] batch [1080/2000] time 2.031 (2.040) data 0.000 (0.001) loss 1.0212 (1.1881) lr 1.7290e-03 eta 1 day, 12:47:15
epoch [18/50] batch [1100/2000] time 2.009 (2.040) data 0.000 (0.001) loss 0.0710 (1.1794) lr 1.7290e-03 eta 1 day, 12:46:30
epoch [18/50] batch [1120/2000] time 2.071 (2.040) data 0.000 (0.001) loss 0.3083 (1.1807) lr 1.7290e-03 eta 1 day, 12:45:59
epoch [18/50] batch [1140/2000] time 2.041 (2.040) data 0.001 (0.001) loss 2.1502 (1.1835) lr 1.7290e-03 eta 1 day, 12:45:26
epoch [18/50] batch [1160/2000] time 2.053 (2.040) data 0.000 (0.001) loss 0.0970 (1.1843) lr 1.7290e-03 eta 1 day, 12:44:54
epoch [18/50] batch [1180/2000] time 2.010 (2.040) data 0.000 (0.001) loss 2.0860 (1.1867) lr 1.7290e-03 eta 1 day, 12:44:06
epoch [18/50] batch [1200/2000] time 2.008 (2.040) data 0.000 (0.001) loss 3.1340 (1.1855) lr 1.7290e-03 eta 1 day, 12:43:21
epoch [18/50] batch [1220/2000] time 2.042 (2.040) data 0.000 (0.001) loss 0.5313 (1.1822) lr 1.7290e-03 eta 1 day, 12:42:41
epoch [18/50] batch [1240/2000] time 2.062 (2.040) data 0.000 (0.001) loss 0.4718 (1.1739) lr 1.7290e-03 eta 1 day, 12:42:04
epoch [18/50] batch [1260/2000] time 2.058 (2.040) data 0.000 (0.001) loss 1.2326 (1.1746) lr 1.7290e-03 eta 1 day, 12:41:20
epoch [18/50] batch [1280/2000] time 2.055 (2.040) data 0.000 (0.001) loss 0.3948 (1.1771) lr 1.7290e-03 eta 1 day, 12:40:38
epoch [18/50] batch [1300/2000] time 2.034 (2.040) data 0.000 (0.001) loss 2.0882 (1.1812) lr 1.7290e-03 eta 1 day, 12:39:53
epoch [18/50] batch [1320/2000] time 2.033 (2.040) data 0.000 (0.001) loss 1.5959 (1.1851) lr 1.7290e-03 eta 1 day, 12:39:00
epoch [18/50] batch [1340/2000] time 2.060 (2.040) data 0.000 (0.001) loss 0.4933 (1.1849) lr 1.7290e-03 eta 1 day, 12:38:19
epoch [18/50] batch [1360/2000] time 2.058 (2.040) data 0.000 (0.001) loss 0.8995 (1.1823) lr 1.7290e-03 eta 1 day, 12:37:34
epoch [18/50] batch [1380/2000] time 2.003 (2.040) data 0.000 (0.001) loss 3.9715 (1.1813) lr 1.7290e-03 eta 1 day, 12:36:52
epoch [18/50] batch [1400/2000] time 1.981 (2.040) data 0.000 (0.001) loss 0.2046 (1.1796) lr 1.7290e-03 eta 1 day, 12:36:05
epoch [18/50] batch [1420/2000] time 2.037 (2.040) data 0.000 (0.001) loss 0.0266 (1.1812) lr 1.7290e-03 eta 1 day, 12:35:18
epoch [18/50] batch [1440/2000] time 2.033 (2.040) data 0.000 (0.001) loss 1.0985 (1.1843) lr 1.7290e-03 eta 1 day, 12:34:31
epoch [18/50] batch [1460/2000] time 2.040 (2.040) data 0.000 (0.001) loss 2.8824 (1.1848) lr 1.7290e-03 eta 1 day, 12:34:01
epoch [18/50] batch [1480/2000] time 2.041 (2.040) data 0.000 (0.001) loss 2.6589 (1.1838) lr 1.7290e-03 eta 1 day, 12:33:18
epoch [18/50] batch [1500/2000] time 2.007 (2.040) data 0.000 (0.001) loss 0.5888 (1.1845) lr 1.7290e-03 eta 1 day, 12:32:33
epoch [18/50] batch [1520/2000] time 2.007 (2.040) data 0.000 (0.001) loss 1.8051 (1.1881) lr 1.7290e-03 eta 1 day, 12:31:52
epoch [18/50] batch [1540/2000] time 1.983 (2.040) data 0.000 (0.001) loss 0.1220 (1.1880) lr 1.7290e-03 eta 1 day, 12:31:12
epoch [18/50] batch [1560/2000] time 2.064 (2.040) data 0.000 (0.001) loss 1.4466 (1.1885) lr 1.7290e-03 eta 1 day, 12:30:34
epoch [18/50] batch [1580/2000] time 2.038 (2.040) data 0.000 (0.001) loss 1.9560 (1.1898) lr 1.7290e-03 eta 1 day, 12:29:55
epoch [18/50] batch [1600/2000] time 2.008 (2.040) data 0.000 (0.001) loss 0.2164 (1.1864) lr 1.7290e-03 eta 1 day, 12:29:18
epoch [18/50] batch [1620/2000] time 2.061 (2.040) data 0.000 (0.001) loss 0.4728 (1.1866) lr 1.7290e-03 eta 1 day, 12:28:39
epoch [18/50] batch [1640/2000] time 2.063 (2.040) data 0.000 (0.001) loss 0.2127 (1.1853) lr 1.7290e-03 eta 1 day, 12:27:59
epoch [18/50] batch [1660/2000] time 2.012 (2.040) data 0.000 (0.001) loss 1.8861 (1.1856) lr 1.7290e-03 eta 1 day, 12:27:18
epoch [18/50] batch [1680/2000] time 2.081 (2.040) data 0.001 (0.001) loss 4.5196 (1.1903) lr 1.7290e-03 eta 1 day, 12:26:41
epoch [18/50] batch [1700/2000] time 2.021 (2.040) data 0.000 (0.001) loss 1.5191 (1.1959) lr 1.7290e-03 eta 1 day, 12:26:11
epoch [18/50] batch [1720/2000] time 2.079 (2.040) data 0.000 (0.001) loss 0.4229 (1.1951) lr 1.7290e-03 eta 1 day, 12:25:35
epoch [18/50] batch [1740/2000] time 2.011 (2.040) data 0.000 (0.001) loss 1.9968 (1.2007) lr 1.7290e-03 eta 1 day, 12:24:57
epoch [18/50] batch [1760/2000] time 2.042 (2.040) data 0.000 (0.001) loss 0.1821 (1.2011) lr 1.7290e-03 eta 1 day, 12:24:15
epoch [18/50] batch [1780/2000] time 2.010 (2.040) data 0.000 (0.001) loss 0.4860 (1.2012) lr 1.7290e-03 eta 1 day, 12:23:37
epoch [18/50] batch [1800/2000] time 2.060 (2.040) data 0.000 (0.001) loss 0.4894 (1.2017) lr 1.7290e-03 eta 1 day, 12:22:59
epoch [18/50] batch [1820/2000] time 2.049 (2.040) data 0.000 (0.001) loss 0.1141 (1.2016) lr 1.7290e-03 eta 1 day, 12:22:18
epoch [18/50] batch [1840/2000] time 2.018 (2.040) data 0.000 (0.001) loss 2.1731 (1.2030) lr 1.7290e-03 eta 1 day, 12:21:34
epoch [18/50] batch [1860/2000] time 2.013 (2.040) data 0.000 (0.001) loss 2.1227 (1.2033) lr 1.7290e-03 eta 1 day, 12:20:57
epoch [18/50] batch [1880/2000] time 2.020 (2.040) data 0.000 (0.001) loss 1.8908 (1.2054) lr 1.7290e-03 eta 1 day, 12:20:14
epoch [18/50] batch [1900/2000] time 2.013 (2.040) data 0.000 (0.001) loss 4.6766 (1.2062) lr 1.7290e-03 eta 1 day, 12:19:40
epoch [18/50] batch [1920/2000] time 2.044 (2.040) data 0.000 (0.001) loss 0.8395 (1.2084) lr 1.7290e-03 eta 1 day, 12:19:02
epoch [18/50] batch [1940/2000] time 2.041 (2.040) data 0.000 (0.001) loss 1.9306 (1.2087) lr 1.7290e-03 eta 1 day, 12:18:26
epoch [18/50] batch [1960/2000] time 2.065 (2.040) data 0.000 (0.001) loss 0.9939 (1.2109) lr 1.7290e-03 eta 1 day, 12:17:45
epoch [18/50] batch [1980/2000] time 2.064 (2.040) data 0.000 (0.001) loss 0.5075 (1.2105) lr 1.7290e-03 eta 1 day, 12:17:09
epoch [18/50] batch [2000/2000] time 2.041 (2.040) data 0.000 (0.001) loss 3.0715 (1.2086) lr 1.6845e-03 eta 1 day, 12:16:29
epoch [19/50] batch [20/2000] time 2.016 (2.075) data 0.000 (0.029) loss 2.8624 (1.5023) lr 1.6845e-03 eta 1 day, 12:52:49
epoch [19/50] batch [40/2000] time 2.067 (2.060) data 0.000 (0.015) loss 1.6245 (1.2423) lr 1.6845e-03 eta 1 day, 12:35:56
epoch [19/50] batch [60/2000] time 2.011 (2.055) data 0.001 (0.010) loss 1.5945 (1.3372) lr 1.6845e-03 eta 1 day, 12:30:12
epoch [19/50] batch [80/2000] time 2.042 (2.051) data 0.000 (0.008) loss 1.3089 (1.2320) lr 1.6845e-03 eta 1 day, 12:25:29
epoch [19/50] batch [100/2000] time 2.012 (2.050) data 0.000 (0.006) loss 0.7205 (1.2613) lr 1.6845e-03 eta 1 day, 12:23:07
epoch [19/50] batch [120/2000] time 2.072 (2.050) data 0.000 (0.005) loss 2.1124 (1.2350) lr 1.6845e-03 eta 1 day, 12:22:02
epoch [19/50] batch [140/2000] time 2.016 (2.049) data 0.000 (0.004) loss 2.7013 (1.2715) lr 1.6845e-03 eta 1 day, 12:21:20
epoch [19/50] batch [160/2000] time 2.006 (2.049) data 0.000 (0.004) loss 0.1410 (1.2336) lr 1.6845e-03 eta 1 day, 12:19:37
epoch [19/50] batch [180/2000] time 2.062 (2.047) data 0.000 (0.003) loss 1.6227 (1.2149) lr 1.6845e-03 eta 1 day, 12:17:49
epoch [19/50] batch [200/2000] time 1.982 (2.046) data 0.000 (0.003) loss 1.0290 (1.2612) lr 1.6845e-03 eta 1 day, 12:15:22
epoch [19/50] batch [220/2000] time 2.555 (2.130) data 0.000 (0.003) loss 0.2444 (1.2613) lr 1.6845e-03 eta 1 day, 13:44:40
epoch [19/50] batch [240/2000] time 2.207 (2.135) data 0.000 (0.003) loss 2.0620 (1.2801) lr 1.6845e-03 eta 1 day, 13:49:13
epoch [19/50] batch [260/2000] time 2.121 (2.146) data 0.000 (0.002) loss 0.2592 (1.2852) lr 1.6845e-03 eta 1 day, 14:00:07
epoch [19/50] batch [280/2000] time 2.544 (2.172) data 0.000 (0.002) loss 1.0813 (1.2760) lr 1.6845e-03 eta 1 day, 14:26:27
epoch [19/50] batch [300/2000] time 2.626 (2.182) data 0.000 (0.002) loss 1.2748 (1.2821) lr 1.6845e-03 eta 1 day, 14:36:54
epoch [19/50] batch [320/2000] time 2.039 (2.214) data 0.000 (0.002) loss 0.2038 (1.2756) lr 1.6845e-03 eta 1 day, 15:10:18
epoch [19/50] batch [340/2000] time 2.062 (2.228) data 0.002 (0.002) loss 1.6909 (1.2886) lr 1.6845e-03 eta 1 day, 15:24:21
epoch [19/50] batch [360/2000] time 2.329 (2.225) data 0.000 (0.002) loss 1.5803 (1.2807) lr 1.6845e-03 eta 1 day, 15:20:18
epoch [19/50] batch [380/2000] time 4.397 (2.336) data 0.000 (0.002) loss 0.2434 (1.2595) lr 1.6845e-03 eta 1 day, 17:17:24
epoch [19/50] batch [400/2000] time 2.298 (2.395) data 0.000 (0.002) loss 0.2855 (1.2622) lr 1.6845e-03 eta 1 day, 18:19:09
epoch [19/50] batch [420/2000] time 2.407 (2.424) data 0.000 (0.002) loss 3.7733 (1.2733) lr 1.6845e-03 eta 1 day, 18:49:04
epoch [19/50] batch [440/2000] time 2.068 (2.417) data 0.000 (0.002) loss 0.3123 (1.2773) lr 1.6845e-03 eta 1 day, 18:40:41
epoch [19/50] batch [460/2000] time 3.417 (2.422) data 0.000 (0.002) loss 0.6794 (1.2797) lr 1.6845e-03 eta 1 day, 18:44:23
epoch [19/50] batch [480/2000] time 2.317 (2.412) data 0.000 (0.002) loss 2.8738 (1.2801) lr 1.6845e-03 eta 1 day, 18:33:58
epoch [19/50] batch [500/2000] time 3.299 (2.431) data 0.000 (0.002) loss 1.3187 (1.2872) lr 1.6845e-03 eta 1 day, 18:52:20
epoch [19/50] batch [520/2000] time 2.058 (2.431) data 0.000 (0.002) loss 2.4301 (1.2910) lr 1.6845e-03 eta 1 day, 18:51:51
epoch [19/50] batch [540/2000] time 2.007 (2.425) data 0.000 (0.002) loss 0.3112 (1.2853) lr 1.6845e-03 eta 1 day, 18:45:20
epoch [19/50] batch [560/2000] time 4.449 (2.454) data 0.000 (0.002) loss 1.9403 (1.2906) lr 1.6845e-03 eta 1 day, 19:14:28
epoch [19/50] batch [580/2000] time 4.428 (2.522) data 0.000 (0.001) loss 0.4876 (1.2787) lr 1.6845e-03 eta 1 day, 20:26:04
epoch [19/50] batch [600/2000] time 4.277 (2.539) data 0.001 (0.001) loss 0.0141 (1.2721) lr 1.6845e-03 eta 1 day, 20:43:19
epoch [19/50] batch [620/2000] time 2.346 (2.533) data 0.000 (0.001) loss 0.2716 (1.2676) lr 1.6845e-03 eta 1 day, 20:35:52
epoch [19/50] batch [640/2000] time 2.020 (2.525) data 0.000 (0.001) loss 0.2115 (1.2659) lr 1.6845e-03 eta 1 day, 20:26:41
epoch [19/50] batch [660/2000] time 3.039 (2.523) data 0.000 (0.001) loss 1.0683 (1.2554) lr 1.6845e-03 eta 1 day, 20:23:32
epoch [19/50] batch [680/2000] time 2.307 (2.524) data 0.014 (0.001) loss 0.6260 (1.2590) lr 1.6845e-03 eta 1 day, 20:23:46
epoch [19/50] batch [700/2000] time 2.370 (2.526) data 0.000 (0.001) loss 1.3866 (1.2443) lr 1.6845e-03 eta 1 day, 20:24:41
epoch [19/50] batch [720/2000] time 2.019 (2.523) data 0.000 (0.001) loss 0.7535 (1.2407) lr 1.6845e-03 eta 1 day, 20:20:24
epoch [19/50] batch [740/2000] time 4.493 (2.524) data 0.000 (0.001) loss 0.7245 (1.2376) lr 1.6845e-03 eta 1 day, 20:21:39
epoch [19/50] batch [760/2000] time 4.508 (2.576) data 0.000 (0.001) loss 0.0503 (1.2277) lr 1.6845e-03 eta 1 day, 21:14:49
epoch [19/50] batch [780/2000] time 2.066 (2.586) data 0.000 (0.001) loss 0.4334 (1.2229) lr 1.6845e-03 eta 1 day, 21:24:28
epoch [19/50] batch [800/2000] time 1.990 (2.572) data 0.000 (0.001) loss 0.9082 (1.2163) lr 1.6845e-03 eta 1 day, 21:09:21
epoch [19/50] batch [820/2000] time 2.060 (2.559) data 0.000 (0.001) loss 0.9871 (1.2132) lr 1.6845e-03 eta 1 day, 20:54:41
epoch [19/50] batch [840/2000] time 2.037 (2.547) data 0.000 (0.001) loss 0.6900 (1.2045) lr 1.6845e-03 eta 1 day, 20:40:52
epoch [19/50] batch [860/2000] time 2.056 (2.535) data 0.000 (0.001) loss 1.7359 (1.2070) lr 1.6845e-03 eta 1 day, 20:27:32
epoch [19/50] batch [880/2000] time 2.004 (2.524) data 0.000 (0.001) loss 0.3727 (1.2150) lr 1.6845e-03 eta 1 day, 20:14:51
epoch [19/50] batch [900/2000] time 2.060 (2.513) data 0.000 (0.001) loss 0.5184 (1.2141) lr 1.6845e-03 eta 1 day, 20:02:41
epoch [19/50] batch [920/2000] time 2.063 (2.503) data 0.000 (0.001) loss 0.7540 (1.2115) lr 1.6845e-03 eta 1 day, 19:51:16
epoch [19/50] batch [940/2000] time 2.039 (2.493) data 0.000 (0.001) loss 0.8096 (1.2085) lr 1.6845e-03 eta 1 day, 19:40:00
epoch [19/50] batch [960/2000] time 2.055 (2.484) data 0.000 (0.001) loss 1.7759 (1.2041) lr 1.6845e-03 eta 1 day, 19:29:22
epoch [19/50] batch [980/2000] time 2.070 (2.475) data 0.000 (0.001) loss 2.4083 (1.2055) lr 1.6845e-03 eta 1 day, 19:19:10
epoch [19/50] batch [1000/2000] time 2.010 (2.466) data 0.000 (0.001) loss 1.1510 (1.2076) lr 1.6845e-03 eta 1 day, 19:09:08
epoch [19/50] batch [1020/2000] time 2.069 (2.458) data 0.000 (0.001) loss 1.0140 (1.2032) lr 1.6845e-03 eta 1 day, 18:59:45
epoch [19/50] batch [1040/2000] time 2.037 (2.450) data 0.000 (0.001) loss 0.5345 (1.2061) lr 1.6845e-03 eta 1 day, 18:50:41
epoch [19/50] batch [1060/2000] time 2.020 (2.442) data 0.000 (0.001) loss 1.6637 (1.2091) lr 1.6845e-03 eta 1 day, 18:41:43
epoch [19/50] batch [1080/2000] time 2.011 (2.435) data 0.000 (0.001) loss 1.1292 (1.2043) lr 1.6845e-03 eta 1 day, 18:33:07
epoch [19/50] batch [1100/2000] time 2.040 (2.427) data 0.000 (0.001) loss 0.3178 (1.2052) lr 1.6845e-03 eta 1 day, 18:24:48
epoch [19/50] batch [1120/2000] time 2.008 (2.421) data 0.000 (0.001) loss 3.6588 (1.2053) lr 1.6845e-03 eta 1 day, 18:16:42
epoch [19/50] batch [1140/2000] time 2.010 (2.414) data 0.001 (0.001) loss 0.3333 (1.2062) lr 1.6845e-03 eta 1 day, 18:08:57
epoch [19/50] batch [1160/2000] time 2.047 (2.407) data 0.000 (0.001) loss 1.4708 (1.2011) lr 1.6845e-03 eta 1 day, 18:01:16
epoch [19/50] batch [1180/2000] time 2.073 (2.401) data 0.000 (0.001) loss 0.3890 (1.1972) lr 1.6845e-03 eta 1 day, 17:54:02
epoch [19/50] batch [1200/2000] time 2.043 (2.395) data 0.000 (0.001) loss 1.0144 (1.1969) lr 1.6845e-03 eta 1 day, 17:46:50
epoch [19/50] batch [1220/2000] time 2.065 (2.389) data 0.000 (0.001) loss 1.5939 (1.1986) lr 1.6845e-03 eta 1 day, 17:39:58
epoch [19/50] batch [1240/2000] time 1.993 (2.384) data 0.000 (0.001) loss 0.0088 (1.1943) lr 1.6845e-03 eta 1 day, 17:33:22
epoch [19/50] batch [1260/2000] time 2.008 (2.378) data 0.000 (0.001) loss 3.2661 (1.2003) lr 1.6845e-03 eta 1 day, 17:26:54
epoch [19/50] batch [1280/2000] time 2.074 (2.373) data 0.000 (0.001) loss 0.9648 (1.2051) lr 1.6845e-03 eta 1 day, 17:20:42
epoch [19/50] batch [1300/2000] time 2.024 (2.368) data 0.000 (0.001) loss 1.4108 (1.2021) lr 1.6845e-03 eta 1 day, 17:14:37
epoch [19/50] batch [1320/2000] time 2.013 (2.363) data 0.000 (0.001) loss 0.1354 (1.2011) lr 1.6845e-03 eta 1 day, 17:08:40
epoch [19/50] batch [1340/2000] time 2.042 (2.358) data 0.000 (0.001) loss 0.8242 (1.2021) lr 1.6845e-03 eta 1 day, 17:02:54
epoch [19/50] batch [1360/2000] time 2.041 (2.354) data 0.000 (0.001) loss 0.5760 (1.2021) lr 1.6845e-03 eta 1 day, 16:57:22
epoch [19/50] batch [1380/2000] time 2.040 (2.349) data 0.000 (0.001) loss 2.7093 (1.2049) lr 1.6845e-03 eta 1 day, 16:51:58
epoch [19/50] batch [1400/2000] time 2.042 (2.345) data 0.000 (0.001) loss 1.0957 (1.2063) lr 1.6845e-03 eta 1 day, 16:46:40
epoch [19/50] batch [1420/2000] time 2.062 (2.341) data 0.000 (0.001) loss 2.1092 (1.2105) lr 1.6845e-03 eta 1 day, 16:41:36
epoch [19/50] batch [1440/2000] time 2.062 (2.337) data 0.000 (0.001) loss 0.4464 (1.2086) lr 1.6845e-03 eta 1 day, 16:36:29
epoch [19/50] batch [1460/2000] time 2.064 (2.333) data 0.000 (0.001) loss 2.5625 (1.2043) lr 1.6845e-03 eta 1 day, 16:31:37
epoch [19/50] batch [1480/2000] time 2.041 (2.329) data 0.000 (0.001) loss 1.0019 (1.2064) lr 1.6845e-03 eta 1 day, 16:26:42
epoch [19/50] batch [1500/2000] time 2.067 (2.325) data 0.000 (0.001) loss 1.2104 (1.2109) lr 1.6845e-03 eta 1 day, 16:21:55
epoch [19/50] batch [1520/2000] time 2.009 (2.321) data 0.000 (0.001) loss 1.1452 (1.2088) lr 1.6845e-03 eta 1 day, 16:17:11
epoch [19/50] batch [1540/2000] time 2.063 (2.318) data 0.000 (0.001) loss 0.9558 (1.2074) lr 1.6845e-03 eta 1 day, 16:12:44
epoch [19/50] batch [1560/2000] time 2.069 (2.314) data 0.000 (0.001) loss 0.6215 (1.2105) lr 1.6845e-03 eta 1 day, 16:08:20
epoch [19/50] batch [1580/2000] time 2.063 (2.311) data 0.000 (0.001) loss 2.1547 (1.2105) lr 1.6845e-03 eta 1 day, 16:04:03
epoch [19/50] batch [1600/2000] time 2.013 (2.307) data 0.000 (0.001) loss 0.1577 (1.2119) lr 1.6845e-03 eta 1 day, 15:59:46
epoch [19/50] batch [1620/2000] time 2.051 (2.304) data 0.000 (0.001) loss 0.2403 (1.2164) lr 1.6845e-03 eta 1 day, 15:55:33
epoch [19/50] batch [1640/2000] time 2.014 (2.301) data 0.000 (0.001) loss 1.0100 (1.2132) lr 1.6845e-03 eta 1 day, 15:51:29
epoch [19/50] batch [1660/2000] time 1.996 (2.298) data 0.000 (0.001) loss 0.1134 (1.2149) lr 1.6845e-03 eta 1 day, 15:47:27
epoch [19/50] batch [1680/2000] time 1.990 (2.295) data 0.001 (0.001) loss 0.2452 (1.2135) lr 1.6845e-03 eta 1 day, 15:43:33
epoch [19/50] batch [1700/2000] time 2.070 (2.292) data 0.000 (0.001) loss 1.1712 (1.2108) lr 1.6845e-03 eta 1 day, 15:39:44
epoch [19/50] batch [1720/2000] time 2.039 (2.289) data 0.000 (0.001) loss 0.7348 (1.2107) lr 1.6845e-03 eta 1 day, 15:35:55
epoch [19/50] batch [1740/2000] time 2.040 (2.286) data 0.000 (0.001) loss 3.5666 (1.2131) lr 1.6845e-03 eta 1 day, 15:32:09
epoch [19/50] batch [1760/2000] time 2.066 (2.283) data 0.000 (0.001) loss 0.8756 (1.2102) lr 1.6845e-03 eta 1 day, 15:28:31
epoch [19/50] batch [1780/2000] time 2.068 (2.281) data 0.000 (0.001) loss 1.4714 (1.2122) lr 1.6845e-03 eta 1 day, 15:24:56
epoch [19/50] batch [1800/2000] time 2.054 (2.278) data 0.000 (0.001) loss 0.5991 (1.2095) lr 1.6845e-03 eta 1 day, 15:21:31
epoch [19/50] batch [1820/2000] time 2.040 (2.276) data 0.000 (0.001) loss 1.2004 (1.2153) lr 1.6845e-03 eta 1 day, 15:18:10
epoch [19/50] batch [1840/2000] time 2.066 (2.273) data 0.000 (0.001) loss 0.6344 (1.2147) lr 1.6845e-03 eta 1 day, 15:14:52
epoch [19/50] batch [1860/2000] time 2.065 (2.271) data 0.000 (0.001) loss 0.5382 (1.2160) lr 1.6845e-03 eta 1 day, 15:11:37
epoch [19/50] batch [1880/2000] time 2.021 (2.268) data 0.000 (0.001) loss 1.5268 (1.2160) lr 1.6845e-03 eta 1 day, 15:08:22
epoch [19/50] batch [1900/2000] time 2.018 (2.266) data 0.000 (0.001) loss 0.6571 (1.2155) lr 1.6845e-03 eta 1 day, 15:05:08
epoch [19/50] batch [1920/2000] time 2.036 (2.264) data 0.000 (0.001) loss 1.4496 (1.2157) lr 1.6845e-03 eta 1 day, 15:01:59
epoch [19/50] batch [1940/2000] time 2.036 (2.261) data 0.000 (0.001) loss 0.1186 (1.2164) lr 1.6845e-03 eta 1 day, 14:58:52
epoch [19/50] batch [1960/2000] time 2.049 (2.259) data 0.000 (0.001) loss 1.4138 (1.2199) lr 1.6845e-03 eta 1 day, 14:55:53
epoch [19/50] batch [1980/2000] time 2.039 (2.257) data 0.000 (0.001) loss 0.6909 (1.2168) lr 1.6845e-03 eta 1 day, 14:52:56
epoch [19/50] batch [2000/2000] time 2.060 (2.255) data 0.000 (0.001) loss 0.0846 (1.2188) lr 1.6374e-03 eta 1 day, 14:49:55
epoch [20/50] batch [20/2000] time 2.065 (2.065) data 0.000 (0.030) loss 0.3981 (1.0877) lr 1.6374e-03 eta 1 day, 11:33:23
epoch [20/50] batch [40/2000] time 2.066 (2.058) data 0.000 (0.015) loss 0.2772 (1.1120) lr 1.6374e-03 eta 1 day, 11:25:35
epoch [20/50] batch [60/2000] time 2.068 (2.052) data 0.001 (0.010) loss 0.8696 (1.1994) lr 1.6374e-03 eta 1 day, 11:18:05
epoch [20/50] batch [80/2000] time 2.067 (2.050) data 0.000 (0.008) loss 1.6026 (1.1491) lr 1.6374e-03 eta 1 day, 11:15:08
epoch [20/50] batch [100/2000] time 2.066 (2.097) data 0.001 (0.006) loss 0.3841 (1.1814) lr 1.6374e-03 eta 1 day, 12:03:25
epoch [20/50] batch [120/2000] time 2.061 (2.181) data 0.000 (0.005) loss 0.2341 (1.2052) lr 1.6374e-03 eta 1 day, 13:29:39
epoch [20/50] batch [140/2000] time 4.441 (2.298) data 0.000 (0.005) loss 0.2687 (1.1676) lr 1.6374e-03 eta 1 day, 15:29:38
epoch [20/50] batch [160/2000] time 4.525 (2.428) data 0.000 (0.004) loss 0.2424 (1.1966) lr 1.6374e-03 eta 1 day, 17:42:48
epoch [20/50] batch [180/2000] time 2.068 (2.534) data 0.000 (0.004) loss 0.1334 (1.2001) lr 1.6374e-03 eta 1 day, 19:31:02
epoch [20/50] batch [200/2000] time 2.305 (2.524) data 0.000 (0.003) loss 2.2121 (1.2064) lr 1.6374e-03 eta 1 day, 19:19:51
epoch [20/50] batch [220/2000] time 2.072 (2.506) data 0.000 (0.003) loss 1.2527 (1.2009) lr 1.6374e-03 eta 1 day, 19:00:20
epoch [20/50] batch [240/2000] time 2.611 (2.488) data 0.000 (0.003) loss 1.7575 (1.2283) lr 1.6374e-03 eta 1 day, 18:41:04
epoch [20/50] batch [260/2000] time 2.025 (2.469) data 0.000 (0.003) loss 2.4869 (1.2247) lr 1.6374e-03 eta 1 day, 18:20:46
epoch [20/50] batch [280/2000] time 2.082 (2.454) data 0.000 (0.003) loss 2.5147 (1.2200) lr 1.6374e-03 eta 1 day, 18:04:36
epoch [20/50] batch [300/2000] time 2.169 (2.444) data 0.000 (0.002) loss 0.4205 (1.2280) lr 1.6374e-03 eta 1 day, 17:53:20
epoch [20/50] batch [320/2000] time 2.333 (2.432) data 0.000 (0.002) loss 1.1307 (1.2353) lr 1.6374e-03 eta 1 day, 17:40:00
epoch [20/50] batch [340/2000] time 4.477 (2.470) data 0.000 (0.002) loss 2.8787 (1.2482) lr 1.6374e-03 eta 1 day, 18:18:50
epoch [20/50] batch [360/2000] time 4.431 (2.581) data 0.000 (0.002) loss 5.9010 (1.2652) lr 1.6374e-03 eta 1 day, 20:11:47
epoch [20/50] batch [380/2000] time 2.300 (2.617) data 0.000 (0.002) loss 1.0236 (1.2598) lr 1.6374e-03 eta 1 day, 20:47:27
epoch [20/50] batch [400/2000] time 4.288 (2.642) data 0.000 (0.002) loss 0.3027 (1.2485) lr 1.6374e-03 eta 1 day, 21:12:30
epoch [20/50] batch [420/2000] time 3.305 (2.665) data 0.000 (0.002) loss 0.3297 (1.2320) lr 1.6374e-03 eta 1 day, 21:35:11
epoch [20/50] batch [440/2000] time 4.487 (2.689) data 0.000 (0.002) loss 0.8754 (1.2278) lr 1.6374e-03 eta 1 day, 21:59:17
epoch [20/50] batch [460/2000] time 4.511 (2.767) data 0.000 (0.002) loss 1.7730 (1.2193) lr 1.6374e-03 eta 1 day, 23:17:49
epoch [20/50] batch [480/2000] time 2.057 (2.762) data 0.000 (0.002) loss 0.8897 (1.2175) lr 1.6374e-03 eta 1 day, 23:11:39
epoch [20/50] batch [500/2000] time 2.061 (2.776) data 0.000 (0.002) loss 0.3405 (1.2142) lr 1.6374e-03 eta 1 day, 23:25:36
epoch [20/50] batch [520/2000] time 2.060 (2.748) data 0.000 (0.002) loss 0.6955 (1.2059) lr 1.6374e-03 eta 1 day, 22:55:58
epoch [20/50] batch [540/2000] time 2.056 (2.722) data 0.000 (0.002) loss 0.2163 (1.1901) lr 1.6374e-03 eta 1 day, 22:28:11
epoch [20/50] batch [560/2000] time 2.059 (2.698) data 0.000 (0.001) loss 1.6699 (1.1913) lr 1.6374e-03 eta 1 day, 22:02:17
epoch [20/50] batch [580/2000] time 2.019 (2.675) data 0.000 (0.001) loss 0.2435 (1.1887) lr 1.6374e-03 eta 1 day, 21:37:59
epoch [20/50] batch [600/2000] time 2.070 (2.654) data 0.001 (0.001) loss 0.5557 (1.1855) lr 1.6374e-03 eta 1 day, 21:15:39
epoch [20/50] batch [620/2000] time 2.042 (2.634) data 0.000 (0.001) loss 0.5308 (1.1777) lr 1.6374e-03 eta 1 day, 20:54:33
epoch [20/50] batch [640/2000] time 2.011 (2.616) data 0.000 (0.001) loss 0.3542 (1.1773) lr 1.6374e-03 eta 1 day, 20:34:49
epoch [20/50] batch [660/2000] time 2.069 (2.598) data 0.000 (0.001) loss 2.8223 (1.1753) lr 1.6374e-03 eta 1 day, 20:16:18
epoch [20/50] batch [680/2000] time 2.041 (2.582) data 0.000 (0.001) loss 0.6256 (1.1704) lr 1.6374e-03 eta 1 day, 19:58:46
epoch [20/50] batch [700/2000] time 2.046 (2.567) data 0.005 (0.001) loss 0.2986 (1.1713) lr 1.6374e-03 eta 1 day, 19:42:13
epoch [20/50] batch [720/2000] time 2.039 (2.552) data 0.000 (0.001) loss 1.4265 (1.1707) lr 1.6374e-03 eta 1 day, 19:26:38
epoch [20/50] batch [740/2000] time 2.037 (2.539) data 0.000 (0.001) loss 0.4251 (1.1715) lr 1.6374e-03 eta 1 day, 19:11:53
epoch [20/50] batch [760/2000] time 2.069 (2.525) data 0.000 (0.001) loss 1.6510 (1.1656) lr 1.6374e-03 eta 1 day, 18:57:35
epoch [20/50] batch [780/2000] time 2.010 (2.513) data 0.000 (0.001) loss 0.2229 (1.1712) lr 1.6374e-03 eta 1 day, 18:44:07
epoch [20/50] batch [800/2000] time 2.064 (2.501) data 0.000 (0.001) loss 1.6592 (1.1699) lr 1.6374e-03 eta 1 day, 18:31:24
epoch [20/50] batch [820/2000] time 2.066 (2.490) data 0.000 (0.001) loss 1.7113 (1.1755) lr 1.6374e-03 eta 1 day, 18:19:20
epoch [20/50] batch [840/2000] time 2.063 (2.480) data 0.000 (0.001) loss 0.2692 (1.1735) lr 1.6374e-03 eta 1 day, 18:07:39
epoch [20/50] batch [860/2000] time 2.064 (2.470) data 0.000 (0.001) loss 0.4163 (1.1821) lr 1.6374e-03 eta 1 day, 17:56:34
epoch [20/50] batch [880/2000] time 2.010 (2.460) data 0.000 (0.001) loss 1.6370 (1.1779) lr 1.6374e-03 eta 1 day, 17:45:55
epoch [20/50] batch [900/2000] time 2.047 (2.451) data 0.000 (0.001) loss 0.2830 (1.1860) lr 1.6374e-03 eta 1 day, 17:35:35
epoch [20/50] batch [920/2000] time 2.011 (2.442) data 0.000 (0.001) loss 2.2969 (1.1849) lr 1.6374e-03 eta 1 day, 17:25:48
epoch [20/50] batch [940/2000] time 2.070 (2.433) data 0.000 (0.001) loss 0.2568 (1.1892) lr 1.6374e-03 eta 1 day, 17:16:28
epoch [20/50] batch [960/2000] time 2.042 (2.425) data 0.000 (0.001) loss 1.0292 (1.1880) lr 1.6374e-03 eta 1 day, 17:07:22
epoch [20/50] batch [980/2000] time 2.063 (2.417) data 0.000 (0.001) loss 1.6958 (1.1871) lr 1.6374e-03 eta 1 day, 16:58:35
epoch [20/50] batch [1000/2000] time 2.012 (2.410) data 0.000 (0.001) loss 2.2476 (1.1866) lr 1.6374e-03 eta 1 day, 16:50:11
epoch [20/50] batch [1020/2000] time 2.014 (2.403) data 0.000 (0.001) loss 2.0219 (1.1916) lr 1.6374e-03 eta 1 day, 16:42:06
epoch [20/50] batch [1040/2000] time 2.041 (2.396) data 0.000 (0.001) loss 0.4348 (1.1884) lr 1.6374e-03 eta 1 day, 16:34:10
epoch [20/50] batch [1060/2000] time 1.988 (2.389) data 0.000 (0.001) loss 1.3074 (1.1857) lr 1.6374e-03 eta 1 day, 16:26:33
epoch [20/50] batch [1080/2000] time 2.047 (2.383) data 0.000 (0.001) loss 0.3529 (1.1892) lr 1.6374e-03 eta 1 day, 16:19:16
epoch [20/50] batch [1100/2000] time 2.080 (2.376) data 0.000 (0.001) loss 0.2788 (1.1884) lr 1.6374e-03 eta 1 day, 16:12:07
epoch [20/50] batch [1120/2000] time 2.063 (2.371) data 0.000 (0.001) loss 0.2664 (1.1877) lr 1.6374e-03 eta 1 day, 16:05:22
epoch [20/50] batch [1140/2000] time 2.060 (2.365) data 0.001 (0.001) loss 0.1286 (1.1843) lr 1.6374e-03 eta 1 day, 15:58:49
epoch [20/50] batch [1160/2000] time 2.041 (2.359) data 0.000 (0.001) loss 3.0731 (1.1818) lr 1.6374e-03 eta 1 day, 15:52:27
epoch [20/50] batch [1180/2000] time 2.018 (2.354) data 0.000 (0.001) loss 0.2093 (1.1733) lr 1.6374e-03 eta 1 day, 15:46:21
epoch [20/50] batch [1200/2000] time 2.014 (2.349) data 0.000 (0.001) loss 0.9867 (1.1754) lr 1.6374e-03 eta 1 day, 15:40:25
epoch [20/50] batch [1220/2000] time 2.062 (2.344) data 0.000 (0.001) loss 1.9314 (1.1867) lr 1.6374e-03 eta 1 day, 15:34:40
epoch [20/50] batch [1240/2000] time 2.063 (2.339) data 0.000 (0.001) loss 0.9815 (1.1916) lr 1.6374e-03 eta 1 day, 15:28:55
epoch [20/50] batch [1260/2000] time 1.985 (2.335) data 0.000 (0.001) loss 1.0077 (1.1913) lr 1.6374e-03 eta 1 day, 15:23:23
epoch [20/50] batch [1280/2000] time 2.037 (2.330) data 0.000 (0.001) loss 0.0977 (1.1898) lr 1.6374e-03 eta 1 day, 15:18:05
epoch [20/50] batch [1300/2000] time 2.065 (2.326) data 0.000 (0.001) loss 0.0313 (1.1872) lr 1.6374e-03 eta 1 day, 15:12:50
epoch [20/50] batch [1320/2000] time 2.075 (2.322) data 0.000 (0.001) loss 0.0572 (1.1859) lr 1.6374e-03 eta 1 day, 15:07:49
epoch [20/50] batch [1340/2000] time 2.067 (2.317) data 0.000 (0.001) loss 0.6022 (1.1904) lr 1.6374e-03 eta 1 day, 15:02:52
epoch [20/50] batch [1360/2000] time 2.008 (2.313) data 0.000 (0.001) loss 0.6140 (1.1884) lr 1.6374e-03 eta 1 day, 14:58:00
epoch [20/50] batch [1380/2000] time 2.065 (2.309) data 0.000 (0.001) loss 0.4383 (1.1860) lr 1.6374e-03 eta 1 day, 14:53:19
epoch [20/50] batch [1400/2000] time 2.040 (2.306) data 0.000 (0.001) loss 3.3001 (1.1880) lr 1.6374e-03 eta 1 day, 14:48:42
epoch [20/50] batch [1420/2000] time 2.071 (2.302) data 0.000 (0.001) loss 0.4928 (1.1911) lr 1.6374e-03 eta 1 day, 14:44:16
epoch [20/50] batch [1440/2000] time 1.987 (2.298) data 0.000 (0.001) loss 3.2827 (1.1931) lr 1.6374e-03 eta 1 day, 14:39:53
epoch [20/50] batch [1460/2000] time 2.061 (2.295) data 0.000 (0.001) loss 1.9523 (1.1905) lr 1.6374e-03 eta 1 day, 14:35:35
epoch [20/50] batch [1480/2000] time 2.062 (2.292) data 0.000 (0.001) loss 0.8641 (1.1883) lr 1.6374e-03 eta 1 day, 14:31:28
epoch [20/50] batch [1500/2000] time 2.010 (2.288) data 0.000 (0.001) loss 0.3741 (1.1879) lr 1.6374e-03 eta 1 day, 14:27:26
epoch [20/50] batch [1520/2000] time 2.008 (2.285) data 0.000 (0.001) loss 1.1368 (1.1925) lr 1.6374e-03 eta 1 day, 14:23:29
epoch [20/50] batch [1540/2000] time 2.008 (2.282) data 0.000 (0.001) loss 0.1902 (1.1856) lr 1.6374e-03 eta 1 day, 14:19:35
epoch [20/50] batch [1560/2000] time 2.062 (2.279) data 0.000 (0.001) loss 2.1246 (1.1856) lr 1.6374e-03 eta 1 day, 14:15:44
epoch [20/50] batch [1580/2000] time 2.071 (2.276) data 0.000 (0.001) loss 0.2493 (1.1845) lr 1.6374e-03 eta 1 day, 14:12:01
epoch [20/50] batch [1600/2000] time 2.015 (2.273) data 0.000 (0.001) loss 0.5383 (1.1872) lr 1.6374e-03 eta 1 day, 14:08:19
epoch [20/50] batch [1620/2000] time 2.010 (2.270) data 0.000 (0.001) loss 0.2774 (1.1864) lr 1.6374e-03 eta 1 day, 14:04:40
epoch [20/50] batch [1640/2000] time 2.010 (2.267) data 0.000 (0.001) loss 1.2487 (1.1896) lr 1.6374e-03 eta 1 day, 14:01:03
epoch [20/50] batch [1660/2000] time 2.079 (2.265) data 0.000 (0.001) loss 0.4458 (1.1885) lr 1.6374e-03 eta 1 day, 13:57:32
epoch [20/50] batch [1680/2000] time 2.010 (2.262) data 0.001 (0.001) loss 0.1344 (1.1875) lr 1.6374e-03 eta 1 day, 13:54:03
epoch [20/50] batch [1700/2000] time 2.046 (2.260) data 0.000 (0.001) loss 0.0519 (1.1876) lr 1.6374e-03 eta 1 day, 13:50:48
epoch [20/50] batch [1720/2000] time 2.065 (2.257) data 0.000 (0.001) loss 5.0296 (1.1891) lr 1.6374e-03 eta 1 day, 13:47:36
epoch [20/50] batch [1740/2000] time 2.010 (2.255) data 0.000 (0.001) loss 0.6860 (1.1852) lr 1.6374e-03 eta 1 day, 13:44:25
epoch [20/50] batch [1760/2000] time 2.072 (2.252) data 0.000 (0.001) loss 0.6265 (1.1881) lr 1.6374e-03 eta 1 day, 13:41:17
epoch [20/50] batch [1780/2000] time 2.064 (2.250) data 0.000 (0.001) loss 1.7461 (1.1894) lr 1.6374e-03 eta 1 day, 13:38:16
epoch [20/50] batch [1800/2000] time 2.072 (2.248) data 0.000 (0.001) loss 1.3404 (1.1920) lr 1.6374e-03 eta 1 day, 13:35:18
epoch [20/50] batch [1820/2000] time 2.071 (2.245) data 0.002 (0.001) loss 1.5651 (1.1975) lr 1.6374e-03 eta 1 day, 13:32:13
epoch [20/50] batch [1840/2000] time 2.069 (2.243) data 0.000 (0.001) loss 0.2119 (1.1949) lr 1.6374e-03 eta 1 day, 13:29:11
epoch [20/50] batch [1860/2000] time 2.045 (2.241) data 0.000 (0.001) loss 0.7209 (1.1981) lr 1.6374e-03 eta 1 day, 13:26:16
epoch [20/50] batch [1880/2000] time 2.076 (2.239) data 0.000 (0.001) loss 0.3554 (1.1968) lr 1.6374e-03 eta 1 day, 13:23:26
epoch [20/50] batch [1900/2000] time 2.066 (2.237) data 0.000 (0.001) loss 0.0988 (1.1968) lr 1.6374e-03 eta 1 day, 13:20:44
epoch [20/50] batch [1920/2000] time 2.019 (2.235) data 0.000 (0.001) loss 1.6954 (1.1979) lr 1.6374e-03 eta 1 day, 13:18:01
epoch [20/50] batch [1940/2000] time 2.065 (2.233) data 0.000 (0.001) loss 2.3916 (1.1973) lr 1.6374e-03 eta 1 day, 13:15:21
epoch [20/50] batch [1960/2000] time 2.044 (2.231) data 0.000 (0.001) loss 1.1695 (1.1991) lr 1.6374e-03 eta 1 day, 13:12:38
epoch [20/50] batch [1980/2000] time 2.062 (2.229) data 0.000 (0.001) loss 0.5868 (1.1989) lr 1.6374e-03 eta 1 day, 13:10:03
epoch [20/50] batch [2000/2000] time 2.038 (2.227) data 0.000 (0.001) loss 0.3025 (1.1987) lr 1.5878e-03 eta 1 day, 13:07:27
epoch [21/50] batch [20/2000] time 2.063 (2.072) data 0.000 (0.028) loss 0.7157 (1.2906) lr 1.5878e-03 eta 1 day, 10:31:13
epoch [21/50] batch [40/2000] time 2.080 (2.059) data 0.000 (0.014) loss 1.5410 (1.3255) lr 1.5878e-03 eta 1 day, 10:17:38
epoch [21/50] batch [60/2000] time 2.037 (2.053) data 0.001 (0.009) loss 0.4154 (1.2844) lr 1.5878e-03 eta 1 day, 10:11:07
epoch [21/50] batch [80/2000] time 2.060 (2.050) data 0.000 (0.007) loss 0.0908 (1.2402) lr 1.5878e-03 eta 1 day, 10:07:07
epoch [21/50] batch [100/2000] time 2.011 (2.049) data 0.000 (0.006) loss 1.1729 (1.2114) lr 1.5878e-03 eta 1 day, 10:05:17
epoch [21/50] batch [120/2000] time 2.017 (2.048) data 0.000 (0.005) loss 1.1151 (1.2061) lr 1.5878e-03 eta 1 day, 10:03:31
epoch [21/50] batch [140/2000] time 2.065 (2.048) data 0.000 (0.004) loss 0.4910 (1.2285) lr 1.5878e-03 eta 1 day, 10:02:57
epoch [21/50] batch [160/2000] time 2.009 (2.047) data 0.000 (0.004) loss 1.4340 (1.2709) lr 1.5878e-03 eta 1 day, 10:02:00
epoch [21/50] batch [180/2000] time 2.064 (2.047) data 0.000 (0.003) loss 0.8227 (1.2723) lr 1.5878e-03 eta 1 day, 10:01:09
epoch [21/50] batch [200/2000] time 2.054 (2.047) data 0.000 (0.003) loss 0.3012 (1.2317) lr 1.5878e-03 eta 1 day, 10:00:25
epoch [21/50] batch [220/2000] time 2.069 (2.047) data 0.000 (0.003) loss 0.3904 (1.2093) lr 1.5878e-03 eta 1 day, 9:59:58
epoch [21/50] batch [240/2000] time 2.044 (2.048) data 0.000 (0.003) loss 1.8086 (1.2003) lr 1.5878e-03 eta 1 day, 9:59:27
epoch [21/50] batch [260/2000] time 2.076 (2.047) data 0.000 (0.002) loss 0.7130 (1.1928) lr 1.5878e-03 eta 1 day, 9:58:24
epoch [21/50] batch [280/2000] time 2.017 (2.047) data 0.000 (0.002) loss 0.9205 (1.1782) lr 1.5878e-03 eta 1 day, 9:57:33
epoch [21/50] batch [300/2000] time 1.996 (2.047) data 0.000 (0.002) loss 4.2773 (1.1999) lr 1.5878e-03 eta 1 day, 9:56:21
epoch [21/50] batch [320/2000] time 2.065 (2.047) data 0.000 (0.002) loss 1.4481 (1.2206) lr 1.5878e-03 eta 1 day, 9:55:41
epoch [21/50] batch [340/2000] time 2.072 (2.047) data 0.000 (0.002) loss 0.3512 (1.2088) lr 1.5878e-03 eta 1 day, 9:55:06
epoch [21/50] batch [360/2000] time 2.014 (2.047) data 0.000 (0.002) loss 0.2041 (1.1932) lr 1.5878e-03 eta 1 day, 9:54:16
epoch [21/50] batch [380/2000] time 2.049 (2.047) data 0.000 (0.002) loss 2.2905 (1.1804) lr 1.5878e-03 eta 1 day, 9:53:50
epoch [21/50] batch [400/2000] time 2.045 (2.047) data 0.000 (0.002) loss 0.0638 (1.1753) lr 1.5878e-03 eta 1 day, 9:53:08
epoch [21/50] batch [420/2000] time 2.065 (2.047) data 0.000 (0.002) loss 0.3587 (1.1832) lr 1.5878e-03 eta 1 day, 9:52:26
epoch [21/50] batch [440/2000] time 2.076 (2.047) data 0.000 (0.002) loss 1.0058 (1.1662) lr 1.5878e-03 eta 1 day, 9:51:54
epoch [21/50] batch [460/2000] time 2.063 (2.047) data 0.000 (0.001) loss 1.5572 (1.1741) lr 1.5878e-03 eta 1 day, 9:51:07
epoch [21/50] batch [480/2000] time 2.085 (2.047) data 0.000 (0.001) loss 1.4967 (1.1816) lr 1.5878e-03 eta 1 day, 9:50:46
epoch [21/50] batch [500/2000] time 2.073 (2.047) data 0.000 (0.001) loss 0.7061 (1.1781) lr 1.5878e-03 eta 1 day, 9:50:08
epoch [21/50] batch [520/2000] time 2.062 (2.047) data 0.000 (0.001) loss 0.5596 (1.1783) lr 1.5878e-03 eta 1 day, 9:49:00
epoch [21/50] batch [540/2000] time 2.062 (2.047) data 0.000 (0.001) loss 0.4278 (1.1852) lr 1.5878e-03 eta 1 day, 9:48:10
epoch [21/50] batch [560/2000] time 2.039 (2.046) data 0.000 (0.001) loss 0.9920 (1.1923) lr 1.5878e-03 eta 1 day, 9:47:11
epoch [21/50] batch [580/2000] time 2.016 (2.046) data 0.000 (0.001) loss 0.4289 (1.1919) lr 1.5878e-03 eta 1 day, 9:46:26
epoch [21/50] batch [600/2000] time 2.042 (2.046) data 0.001 (0.001) loss 0.5735 (1.1927) lr 1.5878e-03 eta 1 day, 9:45:36
epoch [21/50] batch [620/2000] time 2.061 (2.046) data 0.000 (0.001) loss 0.8683 (1.1778) lr 1.5878e-03 eta 1 day, 9:44:57
epoch [21/50] batch [640/2000] time 1.984 (2.046) data 0.000 (0.001) loss 0.1938 (1.1841) lr 1.5878e-03 eta 1 day, 9:44:08
epoch [21/50] batch [660/2000] time 2.061 (2.046) data 0.000 (0.001) loss 0.2647 (1.1903) lr 1.5878e-03 eta 1 day, 9:43:24
epoch [21/50] batch [680/2000] time 2.049 (2.046) data 0.000 (0.001) loss 2.0167 (1.1845) lr 1.5878e-03 eta 1 day, 9:42:30
epoch [21/50] batch [700/2000] time 2.016 (2.046) data 0.001 (0.001) loss 0.9267 (1.1959) lr 1.5878e-03 eta 1 day, 9:42:01
epoch [21/50] batch [720/2000] time 1.986 (2.046) data 0.000 (0.001) loss 0.8636 (1.1994) lr 1.5878e-03 eta 1 day, 9:41:17
epoch [21/50] batch [740/2000] time 2.067 (2.046) data 0.000 (0.001) loss 1.9560 (1.2080) lr 1.5878e-03 eta 1 day, 9:40:26
epoch [21/50] batch [760/2000] time 2.066 (2.046) data 0.000 (0.001) loss 0.2930 (1.2034) lr 1.5878e-03 eta 1 day, 9:39:39
epoch [21/50] batch [780/2000] time 2.016 (2.046) data 0.000 (0.001) loss 1.6398 (1.2042) lr 1.5878e-03 eta 1 day, 9:39:12
epoch [21/50] batch [800/2000] time 2.009 (2.046) data 0.000 (0.001) loss 1.2202 (1.2036) lr 1.5878e-03 eta 1 day, 9:38:23
epoch [21/50] batch [820/2000] time 2.011 (2.046) data 0.000 (0.001) loss 1.8763 (1.2085) lr 1.5878e-03 eta 1 day, 9:37:36
epoch [21/50] batch [840/2000] time 2.051 (2.045) data 0.000 (0.001) loss 1.2208 (1.2064) lr 1.5878e-03 eta 1 day, 9:36:47
epoch [21/50] batch [860/2000] time 2.044 (2.045) data 0.000 (0.001) loss 1.5926 (1.2077) lr 1.5878e-03 eta 1 day, 9:36:07
epoch [21/50] batch [880/2000] time 2.016 (2.045) data 0.000 (0.001) loss 0.2301 (1.2051) lr 1.5878e-03 eta 1 day, 9:35:21
epoch [21/50] batch [900/2000] time 2.062 (2.045) data 0.000 (0.001) loss 1.2111 (1.2004) lr 1.5878e-03 eta 1 day, 9:34:33
epoch [21/50] batch [920/2000] time 2.059 (2.045) data 0.000 (0.001) loss 1.8646 (1.1982) lr 1.5878e-03 eta 1 day, 9:33:53
epoch [21/50] batch [940/2000] time 2.067 (2.045) data 0.000 (0.001) loss 2.9549 (1.2011) lr 1.5878e-03 eta 1 day, 9:33:15
epoch [21/50] batch [960/2000] time 2.040 (2.045) data 0.000 (0.001) loss 0.6759 (1.2010) lr 1.5878e-03 eta 1 day, 9:32:32
epoch [21/50] batch [980/2000] time 2.067 (2.045) data 0.000 (0.001) loss 2.3396 (1.1985) lr 1.5878e-03 eta 1 day, 9:31:46
epoch [21/50] batch [1000/2000] time 1.998 (2.045) data 0.000 (0.001) loss 0.0822 (1.1984) lr 1.5878e-03 eta 1 day, 9:31:08
epoch [21/50] batch [1020/2000] time 2.044 (2.045) data 0.000 (0.001) loss 1.8095 (1.1971) lr 1.5878e-03 eta 1 day, 9:30:24
epoch [21/50] batch [1040/2000] time 2.075 (2.045) data 0.002 (0.001) loss 0.7475 (1.1960) lr 1.5878e-03 eta 1 day, 9:29:29
epoch [21/50] batch [1060/2000] time 2.063 (2.045) data 0.000 (0.001) loss 1.4565 (1.1991) lr 1.5878e-03 eta 1 day, 9:28:46
epoch [21/50] batch [1080/2000] time 2.063 (2.045) data 0.000 (0.001) loss 0.5652 (1.2060) lr 1.5878e-03 eta 1 day, 9:28:04
epoch [21/50] batch [1100/2000] time 2.017 (2.045) data 0.000 (0.001) loss 0.6881 (1.2024) lr 1.5878e-03 eta 1 day, 9:27:16
epoch [21/50] batch [1120/2000] time 2.055 (2.045) data 0.000 (0.001) loss 1.0186 (1.2084) lr 1.5878e-03 eta 1 day, 9:26:34
epoch [21/50] batch [1140/2000] time 2.073 (2.045) data 0.001 (0.001) loss 0.5626 (1.2130) lr 1.5878e-03 eta 1 day, 9:25:59
epoch [21/50] batch [1160/2000] time 2.042 (2.045) data 0.000 (0.001) loss 0.5363 (1.2067) lr 1.5878e-03 eta 1 day, 9:25:11
epoch [21/50] batch [1180/2000] time 2.017 (2.045) data 0.000 (0.001) loss 0.4874 (1.2064) lr 1.5878e-03 eta 1 day, 9:24:31
epoch [21/50] batch [1200/2000] time 2.007 (2.045) data 0.000 (0.001) loss 0.6160 (1.2101) lr 1.5878e-03 eta 1 day, 9:23:46
epoch [21/50] batch [1220/2000] time 2.050 (2.045) data 0.000 (0.001) loss 0.8136 (1.2134) lr 1.5878e-03 eta 1 day, 9:23:01
epoch [21/50] batch [1240/2000] time 2.075 (2.045) data 0.000 (0.001) loss 0.3831 (1.2121) lr 1.5878e-03 eta 1 day, 9:22:19
epoch [21/50] batch [1260/2000] time 2.072 (2.045) data 0.000 (0.001) loss 0.2253 (1.2077) lr 1.5878e-03 eta 1 day, 9:21:35
epoch [21/50] batch [1280/2000] time 2.006 (2.044) data 0.000 (0.001) loss 0.2355 (1.2076) lr 1.5878e-03 eta 1 day, 9:20:50
epoch [21/50] batch [1300/2000] time 2.008 (2.044) data 0.000 (0.001) loss 0.0795 (1.2053) lr 1.5878e-03 eta 1 day, 9:20:05
epoch [21/50] batch [1320/2000] time 2.071 (2.044) data 0.000 (0.001) loss 0.6796 (1.2024) lr 1.5878e-03 eta 1 day, 9:19:22
epoch [21/50] batch [1340/2000] time 2.012 (2.044) data 0.000 (0.001) loss 3.3237 (1.2068) lr 1.5878e-03 eta 1 day, 9:18:42
epoch [21/50] batch [1360/2000] time 2.062 (2.044) data 0.000 (0.001) loss 0.2168 (1.2075) lr 1.5878e-03 eta 1 day, 9:18:02
epoch [21/50] batch [1380/2000] time 2.014 (2.044) data 0.000 (0.001) loss 0.7038 (1.2073) lr 1.5878e-03 eta 1 day, 9:17:21
epoch [21/50] batch [1400/2000] time 2.068 (2.044) data 0.000 (0.001) loss 1.8461 (1.2067) lr 1.5878e-03 eta 1 day, 9:16:44
epoch [21/50] batch [1420/2000] time 2.061 (2.044) data 0.000 (0.001) loss 1.4051 (1.2073) lr 1.5878e-03 eta 1 day, 9:15:55
epoch [21/50] batch [1440/2000] time 2.092 (2.045) data 0.000 (0.001) loss 1.4537 (1.2048) lr 1.5878e-03 eta 1 day, 9:15:26
epoch [21/50] batch [1460/2000] time 2.019 (2.045) data 0.000 (0.001) loss 2.3219 (1.2071) lr 1.5878e-03 eta 1 day, 9:14:55
epoch [21/50] batch [1480/2000] time 2.008 (2.045) data 0.000 (0.001) loss 2.2054 (1.2086) lr 1.5878e-03 eta 1 day, 9:14:18
epoch [21/50] batch [1500/2000] time 2.009 (2.045) data 0.000 (0.001) loss 0.7122 (1.2120) lr 1.5878e-03 eta 1 day, 9:13:38
epoch [21/50] batch [1520/2000] time 2.040 (2.045) data 0.000 (0.001) loss 0.6304 (1.2090) lr 1.5878e-03 eta 1 day, 9:12:54
epoch [21/50] batch [1540/2000] time 2.064 (2.045) data 0.000 (0.001) loss 0.5212 (1.2065) lr 1.5878e-03 eta 1 day, 9:12:14
epoch [21/50] batch [1560/2000] time 2.070 (2.045) data 0.000 (0.001) loss 0.4196 (1.2050) lr 1.5878e-03 eta 1 day, 9:11:33
epoch [21/50] batch [1580/2000] time 2.011 (2.045) data 0.000 (0.001) loss 0.6491 (1.2043) lr 1.5878e-03 eta 1 day, 9:10:49
epoch [21/50] batch [1600/2000] time 2.043 (2.045) data 0.000 (0.001) loss 1.4230 (1.2057) lr 1.5878e-03 eta 1 day, 9:10:14
epoch [21/50] batch [1620/2000] time 2.015 (2.045) data 0.000 (0.001) loss 0.1980 (1.2042) lr 1.5878e-03 eta 1 day, 9:09:31
epoch [21/50] batch [1640/2000] time 2.068 (2.045) data 0.000 (0.001) loss 0.1703 (1.2023) lr 1.5878e-03 eta 1 day, 9:08:47
epoch [21/50] batch [1660/2000] time 2.071 (2.045) data 0.000 (0.001) loss 1.5261 (1.2024) lr 1.5878e-03 eta 1 day, 9:08:04
epoch [21/50] batch [1680/2000] time 2.062 (2.045) data 0.001 (0.001) loss 0.5863 (1.2033) lr 1.5878e-03 eta 1 day, 9:07:22
epoch [21/50] batch [1700/2000] time 2.045 (2.045) data 0.000 (0.001) loss 3.4056 (1.2066) lr 1.5878e-03 eta 1 day, 9:06:40
epoch [21/50] batch [1720/2000] time 2.069 (2.045) data 0.000 (0.001) loss 0.3363 (1.2038) lr 1.5878e-03 eta 1 day, 9:05:58
epoch [21/50] batch [1740/2000] time 2.017 (2.045) data 0.000 (0.001) loss 1.4451 (1.2029) lr 1.5878e-03 eta 1 day, 9:05:12
epoch [21/50] batch [1760/2000] time 2.066 (2.045) data 0.000 (0.001) loss 3.0616 (1.2037) lr 1.5878e-03 eta 1 day, 9:04:32
epoch [21/50] batch [1780/2000] time 2.046 (2.044) data 0.000 (0.001) loss 1.5486 (1.2058) lr 1.5878e-03 eta 1 day, 9:03:50
epoch [21/50] batch [1800/2000] time 2.064 (2.044) data 0.000 (0.001) loss 1.5290 (1.2067) lr 1.5878e-03 eta 1 day, 9:03:08
epoch [21/50] batch [1820/2000] time 2.063 (2.044) data 0.000 (0.001) loss 1.1216 (1.2012) lr 1.5878e-03 eta 1 day, 9:02:28
epoch [21/50] batch [1840/2000] time 2.046 (2.044) data 0.000 (0.001) loss 2.2845 (1.2006) lr 1.5878e-03 eta 1 day, 9:01:47
epoch [21/50] batch [1860/2000] time 2.011 (2.044) data 0.000 (0.001) loss 0.1866 (1.2016) lr 1.5878e-03 eta 1 day, 9:01:06
epoch [21/50] batch [1880/2000] time 2.065 (2.044) data 0.000 (0.001) loss 4.6537 (1.2034) lr 1.5878e-03 eta 1 day, 9:00:20
epoch [21/50] batch [1900/2000] time 2.063 (2.044) data 0.000 (0.001) loss 1.6054 (1.2036) lr 1.5878e-03 eta 1 day, 8:59:39
epoch [21/50] batch [1920/2000] time 2.019 (2.044) data 0.000 (0.001) loss 0.9175 (1.2105) lr 1.5878e-03 eta 1 day, 8:58:53
epoch [21/50] batch [1940/2000] time 2.063 (2.044) data 0.002 (0.001) loss 0.3173 (1.2060) lr 1.5878e-03 eta 1 day, 8:58:13
epoch [21/50] batch [1960/2000] time 2.039 (2.044) data 0.000 (0.001) loss 0.7693 (1.2037) lr 1.5878e-03 eta 1 day, 8:57:32
epoch [21/50] batch [1980/2000] time 2.063 (2.044) data 0.000 (0.001) loss 1.0415 (1.2020) lr 1.5878e-03 eta 1 day, 8:56:53
epoch [21/50] batch [2000/2000] time 2.036 (2.044) data 0.000 (0.001) loss 1.2250 (1.2010) lr 1.5358e-03 eta 1 day, 8:56:10
epoch [22/50] batch [20/2000] time 2.061 (2.067) data 0.000 (0.028) loss 0.0644 (1.0526) lr 1.5358e-03 eta 1 day, 9:17:29
epoch [22/50] batch [40/2000] time 2.065 (2.058) data 0.000 (0.014) loss 0.3753 (1.0523) lr 1.5358e-03 eta 1 day, 9:07:58
epoch [22/50] batch [60/2000] time 2.063 (2.055) data 0.001 (0.009) loss 0.7113 (1.0560) lr 1.5358e-03 eta 1 day, 9:04:54
epoch [22/50] batch [80/2000] time 2.062 (2.050) data 0.000 (0.007) loss 0.6436 (1.1628) lr 1.5358e-03 eta 1 day, 8:58:37
epoch [22/50] batch [100/2000] time 2.020 (2.048) data 0.000 (0.006) loss 0.1718 (1.2048) lr 1.5358e-03 eta 1 day, 8:56:27
epoch [22/50] batch [120/2000] time 2.061 (2.048) data 0.000 (0.005) loss 2.8757 (1.2384) lr 1.5358e-03 eta 1 day, 8:55:15
epoch [22/50] batch [140/2000] time 2.008 (2.048) data 0.000 (0.004) loss 0.1895 (1.2216) lr 1.5358e-03 eta 1 day, 8:54:33
epoch [22/50] batch [160/2000] time 2.069 (2.047) data 0.000 (0.004) loss 3.3582 (1.2272) lr 1.5358e-03 eta 1 day, 8:53:26
epoch [22/50] batch [180/2000] time 2.020 (2.047) data 0.000 (0.003) loss 0.8589 (1.2121) lr 1.5358e-03 eta 1 day, 8:52:52
epoch [22/50] batch [200/2000] time 2.061 (2.047) data 0.000 (0.003) loss 2.9284 (1.2346) lr 1.5358e-03 eta 1 day, 8:52:08
epoch [22/50] batch [220/2000] time 2.063 (2.048) data 0.000 (0.003) loss 1.6044 (1.2212) lr 1.5358e-03 eta 1 day, 8:52:05
epoch [22/50] batch [240/2000] time 1.986 (2.047) data 0.000 (0.003) loss 0.3501 (1.2037) lr 1.5358e-03 eta 1 day, 8:50:55
epoch [22/50] batch [260/2000] time 2.084 (2.047) data 0.000 (0.002) loss 1.7354 (1.2274) lr 1.5358e-03 eta 1 day, 8:50:03
epoch [22/50] batch [280/2000] time 2.081 (2.047) data 0.000 (0.002) loss 1.1145 (1.2538) lr 1.5358e-03 eta 1 day, 8:49:26
epoch [22/50] batch [300/2000] time 2.064 (2.048) data 0.000 (0.002) loss 0.8611 (1.2766) lr 1.5358e-03 eta 1 day, 8:49:16
epoch [22/50] batch [320/2000] time 2.038 (2.048) data 0.000 (0.002) loss 1.7865 (1.2731) lr 1.5358e-03 eta 1 day, 8:48:23
epoch [22/50] batch [340/2000] time 2.041 (2.047) data 0.000 (0.002) loss 1.9137 (1.2841) lr 1.5358e-03 eta 1 day, 8:47:18
epoch [22/50] batch [360/2000] time 2.084 (2.047) data 0.000 (0.002) loss 0.9037 (1.2798) lr 1.5358e-03 eta 1 day, 8:46:57
epoch [22/50] batch [380/2000] time 2.039 (2.047) data 0.000 (0.002) loss 1.8950 (1.2741) lr 1.5358e-03 eta 1 day, 8:45:55
epoch [22/50] batch [400/2000] time 1.989 (2.047) data 0.000 (0.002) loss 1.1837 (1.2858) lr 1.5358e-03 eta 1 day, 8:45:17
epoch [22/50] batch [420/2000] time 2.070 (2.047) data 0.000 (0.002) loss 1.0965 (1.2901) lr 1.5358e-03 eta 1 day, 8:44:26
epoch [22/50] batch [440/2000] time 2.056 (2.047) data 0.000 (0.002) loss 1.3783 (1.2652) lr 1.5358e-03 eta 1 day, 8:44:00
epoch [22/50] batch [460/2000] time 2.047 (2.047) data 0.000 (0.001) loss 0.1401 (1.2715) lr 1.5358e-03 eta 1 day, 8:43:32
epoch [22/50] batch [480/2000] time 2.069 (2.047) data 0.000 (0.001) loss 1.4414 (1.2666) lr 1.5358e-03 eta 1 day, 8:42:44
epoch [22/50] batch [500/2000] time 2.015 (2.048) data 0.000 (0.001) loss 1.4990 (1.2599) lr 1.5358e-03 eta 1 day, 8:42:12
epoch [22/50] batch [520/2000] time 2.069 (2.047) data 0.000 (0.001) loss 0.5821 (1.2623) lr 1.5358e-03 eta 1 day, 8:41:14
epoch [22/50] batch [540/2000] time 2.069 (2.047) data 0.000 (0.001) loss 1.3830 (1.2519) lr 1.5358e-03 eta 1 day, 8:40:35
epoch [22/50] batch [560/2000] time 2.072 (2.047) data 0.000 (0.001) loss 0.1633 (1.2517) lr 1.5358e-03 eta 1 day, 8:39:53
epoch [22/50] batch [580/2000] time 2.073 (2.047) data 0.000 (0.001) loss 1.4949 (1.2506) lr 1.5358e-03 eta 1 day, 8:39:04
epoch [22/50] batch [600/2000] time 2.068 (2.047) data 0.001 (0.001) loss 0.8878 (1.2499) lr 1.5358e-03 eta 1 day, 8:38:17
epoch [22/50] batch [620/2000] time 2.013 (2.047) data 0.000 (0.001) loss 2.3888 (1.2484) lr 1.5358e-03 eta 1 day, 8:37:36
epoch [22/50] batch [640/2000] time 2.042 (2.047) data 0.000 (0.001) loss 0.8561 (1.2431) lr 1.5358e-03 eta 1 day, 8:36:51
epoch [22/50] batch [660/2000] time 2.013 (2.047) data 0.000 (0.001) loss 0.7007 (1.2361) lr 1.5358e-03 eta 1 day, 8:36:03
epoch [22/50] batch [680/2000] time 2.047 (2.047) data 0.000 (0.001) loss 0.6020 (1.2369) lr 1.5358e-03 eta 1 day, 8:35:20
epoch [22/50] batch [700/2000] time 2.064 (2.047) data 0.000 (0.001) loss 0.0944 (1.2261) lr 1.5358e-03 eta 1 day, 8:34:38
epoch [22/50] batch [720/2000] time 2.008 (2.047) data 0.000 (0.001) loss 0.4318 (1.2204) lr 1.5358e-03 eta 1 day, 8:33:59
epoch [22/50] batch [740/2000] time 2.010 (2.047) data 0.000 (0.001) loss 1.1043 (1.2214) lr 1.5358e-03 eta 1 day, 8:33:16
epoch [22/50] batch [760/2000] time 2.020 (2.047) data 0.000 (0.001) loss 1.7196 (1.2307) lr 1.5358e-03 eta 1 day, 8:32:29
epoch [22/50] batch [780/2000] time 2.065 (2.046) data 0.000 (0.001) loss 0.9287 (1.2268) lr 1.5358e-03 eta 1 day, 8:31:35
epoch [22/50] batch [800/2000] time 2.039 (2.047) data 0.000 (0.001) loss 0.0970 (1.2240) lr 1.5358e-03 eta 1 day, 8:31:12
epoch [22/50] batch [820/2000] time 2.047 (2.047) data 0.000 (0.001) loss 0.3155 (1.2226) lr 1.5358e-03 eta 1 day, 8:30:27
epoch [22/50] batch [840/2000] time 2.038 (2.047) data 0.000 (0.001) loss 0.8793 (1.2198) lr 1.5358e-03 eta 1 day, 8:29:40
epoch [22/50] batch [860/2000] time 2.080 (2.047) data 0.000 (0.001) loss 3.4741 (1.2253) lr 1.5358e-03 eta 1 day, 8:29:02
epoch [22/50] batch [880/2000] time 2.064 (2.047) data 0.000 (0.001) loss 0.1773 (1.2224) lr 1.5358e-03 eta 1 day, 8:28:18
epoch [22/50] batch [900/2000] time 2.070 (2.047) data 0.000 (0.001) loss 0.4126 (1.2294) lr 1.5358e-03 eta 1 day, 8:27:43
epoch [22/50] batch [920/2000] time 2.039 (2.047) data 0.000 (0.001) loss 0.3880 (1.2244) lr 1.5358e-03 eta 1 day, 8:27:00
epoch [22/50] batch [940/2000] time 2.020 (2.047) data 0.000 (0.001) loss 0.9139 (1.2207) lr 1.5358e-03 eta 1 day, 8:26:20
epoch [22/50] batch [960/2000] time 2.010 (2.047) data 0.003 (0.001) loss 1.9324 (1.2187) lr 1.5358e-03 eta 1 day, 8:25:41
epoch [22/50] batch [980/2000] time 2.066 (2.047) data 0.000 (0.001) loss 0.6332 (1.2208) lr 1.5358e-03 eta 1 day, 8:25:15
epoch [22/50] batch [1000/2000] time 2.014 (2.047) data 0.000 (0.001) loss 1.2826 (1.2150) lr 1.5358e-03 eta 1 day, 8:24:54
epoch [22/50] batch [1020/2000] time 2.014 (2.047) data 0.000 (0.001) loss 1.4867 (1.2177) lr 1.5358e-03 eta 1 day, 8:24:11
epoch [22/50] batch [1040/2000] time 2.045 (2.047) data 0.000 (0.001) loss 2.1528 (1.2160) lr 1.5358e-03 eta 1 day, 8:23:29
epoch [22/50] batch [1060/2000] time 2.070 (2.047) data 0.000 (0.001) loss 0.8385 (1.2193) lr 1.5358e-03 eta 1 day, 8:22:50
epoch [22/50] batch [1080/2000] time 2.047 (2.047) data 0.000 (0.001) loss 0.3805 (1.2176) lr 1.5358e-03 eta 1 day, 8:22:09
epoch [22/50] batch [1100/2000] time 1.991 (2.047) data 0.000 (0.001) loss 0.6673 (1.2087) lr 1.5358e-03 eta 1 day, 8:21:26
epoch [22/50] batch [1120/2000] time 2.012 (2.047) data 0.000 (0.001) loss 0.9566 (1.2202) lr 1.5358e-03 eta 1 day, 8:20:56
epoch [22/50] batch [1140/2000] time 2.051 (2.047) data 0.001 (0.001) loss 0.9738 (1.2189) lr 1.5358e-03 eta 1 day, 8:20:11
epoch [22/50] batch [1160/2000] time 2.071 (2.047) data 0.000 (0.001) loss 1.1123 (1.2194) lr 1.5358e-03 eta 1 day, 8:19:35
epoch [22/50] batch [1180/2000] time 2.011 (2.047) data 0.000 (0.001) loss 2.6520 (1.2191) lr 1.5358e-03 eta 1 day, 8:18:52
epoch [22/50] batch [1200/2000] time 2.072 (2.047) data 0.000 (0.001) loss 0.6299 (1.2213) lr 1.5358e-03 eta 1 day, 8:18:15
epoch [22/50] batch [1220/2000] time 2.013 (2.048) data 0.000 (0.001) loss 1.5120 (1.2195) lr 1.5358e-03 eta 1 day, 8:17:39
epoch [22/50] batch [1240/2000] time 2.076 (2.048) data 0.000 (0.001) loss 0.5022 (1.2191) lr 1.5358e-03 eta 1 day, 8:17:04
epoch [22/50] batch [1260/2000] time 2.073 (2.048) data 0.000 (0.001) loss 1.2301 (1.2203) lr 1.5358e-03 eta 1 day, 8:16:32
epoch [22/50] batch [1280/2000] time 2.046 (2.048) data 0.000 (0.001) loss 0.3680 (1.2178) lr 1.5358e-03 eta 1 day, 8:15:51
epoch [22/50] batch [1300/2000] time 2.001 (2.048) data 0.000 (0.001) loss 0.9068 (1.2160) lr 1.5358e-03 eta 1 day, 8:15:14
epoch [22/50] batch [1320/2000] time 2.076 (2.048) data 0.002 (0.001) loss 0.7014 (1.2098) lr 1.5358e-03 eta 1 day, 8:14:39
epoch [22/50] batch [1340/2000] time 2.072 (2.048) data 0.000 (0.001) loss 2.8831 (1.2120) lr 1.5358e-03 eta 1 day, 8:14:07
epoch [22/50] batch [1360/2000] time 2.046 (2.048) data 0.000 (0.001) loss 0.1404 (1.2147) lr 1.5358e-03 eta 1 day, 8:13:24
epoch [22/50] batch [1380/2000] time 2.070 (2.048) data 0.000 (0.001) loss 1.7857 (1.2121) lr 1.5358e-03 eta 1 day, 8:12:45
epoch [22/50] batch [1400/2000] time 2.068 (2.048) data 0.000 (0.001) loss 0.0811 (1.2093) lr 1.5358e-03 eta 1 day, 8:11:58
epoch [22/50] batch [1420/2000] time 1.989 (2.048) data 0.000 (0.001) loss 0.3028 (1.2088) lr 1.5358e-03 eta 1 day, 8:11:17
epoch [22/50] batch [1440/2000] time 2.075 (2.048) data 0.000 (0.001) loss 2.5442 (1.2063) lr 1.5358e-03 eta 1 day, 8:10:37
epoch [22/50] batch [1460/2000] time 2.042 (2.048) data 0.000 (0.001) loss 0.2832 (1.2008) lr 1.5358e-03 eta 1 day, 8:09:58
epoch [22/50] batch [1480/2000] time 2.073 (2.048) data 0.000 (0.001) loss 0.4849 (1.2012) lr 1.5358e-03 eta 1 day, 8:09:17
epoch [22/50] batch [1500/2000] time 2.067 (2.048) data 0.000 (0.001) loss 1.1138 (1.2024) lr 1.5358e-03 eta 1 day, 8:08:38
epoch [22/50] batch [1520/2000] time 2.072 (2.048) data 0.000 (0.001) loss 0.3032 (1.2031) lr 1.5358e-03 eta 1 day, 8:07:57
epoch [22/50] batch [1540/2000] time 2.045 (2.048) data 0.000 (0.001) loss 1.2573 (1.2018) lr 1.5358e-03 eta 1 day, 8:07:16
epoch [22/50] batch [1560/2000] time 2.013 (2.048) data 0.000 (0.001) loss 0.6792 (1.1991) lr 1.5358e-03 eta 1 day, 8:06:34
epoch [22/50] batch [1580/2000] time 2.074 (2.048) data 0.000 (0.001) loss 2.3353 (1.2030) lr 1.5358e-03 eta 1 day, 8:05:45
epoch [22/50] batch [1600/2000] time 2.042 (2.048) data 0.000 (0.001) loss 0.8193 (1.2040) lr 1.5358e-03 eta 1 day, 8:05:02
epoch [22/50] batch [1620/2000] time 2.010 (2.048) data 0.000 (0.001) loss 0.1114 (1.2054) lr 1.5358e-03 eta 1 day, 8:04:19
epoch [22/50] batch [1640/2000] time 2.072 (2.048) data 0.000 (0.001) loss 0.8992 (1.2046) lr 1.5358e-03 eta 1 day, 8:03:39
epoch [22/50] batch [1660/2000] time 2.068 (2.048) data 0.000 (0.001) loss 1.8811 (1.2006) lr 1.5358e-03 eta 1 day, 8:03:00
epoch [22/50] batch [1680/2000] time 2.068 (2.048) data 0.001 (0.001) loss 4.9694 (1.2032) lr 1.5358e-03 eta 1 day, 8:02:17
epoch [22/50] batch [1700/2000] time 2.074 (2.048) data 0.000 (0.001) loss 0.0747 (1.2053) lr 1.5358e-03 eta 1 day, 8:01:43
epoch [22/50] batch [1720/2000] time 2.045 (2.048) data 0.000 (0.001) loss 0.6579 (1.2091) lr 1.5358e-03 eta 1 day, 8:00:56
epoch [22/50] batch [1740/2000] time 2.070 (2.048) data 0.000 (0.001) loss 0.4860 (1.2098) lr 1.5358e-03 eta 1 day, 8:00:20
epoch [22/50] batch [1760/2000] time 2.013 (2.048) data 0.000 (0.001) loss 1.4083 (1.2105) lr 1.5358e-03 eta 1 day, 7:59:36
epoch [22/50] batch [1780/2000] time 2.078 (2.048) data 0.000 (0.001) loss 0.4417 (1.2093) lr 1.5358e-03 eta 1 day, 7:58:53
epoch [22/50] batch [1800/2000] time 2.025 (2.048) data 0.000 (0.001) loss 1.1548 (1.2075) lr 1.5358e-03 eta 1 day, 7:58:13
epoch [22/50] batch [1820/2000] time 2.047 (2.048) data 0.001 (0.001) loss 0.4609 (1.2080) lr 1.5358e-03 eta 1 day, 7:57:28
epoch [22/50] batch [1840/2000] time 2.084 (2.048) data 0.000 (0.001) loss 2.1236 (1.2083) lr 1.5358e-03 eta 1 day, 7:56:51
epoch [22/50] batch [1860/2000] time 2.095 (2.048) data 0.000 (0.001) loss 0.4783 (1.2087) lr 1.5358e-03 eta 1 day, 7:56:18
epoch [22/50] batch [1880/2000] time 2.028 (2.048) data 0.000 (0.001) loss 1.1694 (1.2073) lr 1.5358e-03 eta 1 day, 7:55:41
epoch [22/50] batch [1900/2000] time 2.094 (2.048) data 0.000 (0.001) loss 0.3198 (1.2029) lr 1.5358e-03 eta 1 day, 7:55:12
epoch [22/50] batch [1920/2000] time 2.080 (2.049) data 0.000 (0.001) loss 1.8163 (1.2039) lr 1.5358e-03 eta 1 day, 7:54:43
epoch [22/50] batch [1940/2000] time 1.986 (2.048) data 0.000 (0.001) loss 0.2769 (1.2056) lr 1.5358e-03 eta 1 day, 7:53:58
epoch [22/50] batch [1960/2000] time 2.046 (2.048) data 0.000 (0.001) loss 0.1299 (1.2058) lr 1.5358e-03 eta 1 day, 7:53:16
epoch [22/50] batch [1980/2000] time 2.064 (2.048) data 0.000 (0.001) loss 1.1853 (1.2067) lr 1.5358e-03 eta 1 day, 7:52:35
epoch [22/50] batch [2000/2000] time 2.067 (2.048) data 0.000 (0.001) loss 1.4844 (1.2068) lr 1.4818e-03 eta 1 day, 7:51:52
epoch [23/50] batch [20/2000] time 2.052 (2.088) data 0.000 (0.035) loss 0.3573 (1.1189) lr 1.4818e-03 eta 1 day, 8:28:02
epoch [23/50] batch [40/2000] time 2.074 (2.066) data 0.000 (0.018) loss 1.2914 (0.9020) lr 1.4818e-03 eta 1 day, 8:06:44
epoch [23/50] batch [60/2000] time 2.045 (2.059) data 0.001 (0.012) loss 0.2294 (1.1179) lr 1.4818e-03 eta 1 day, 7:59:46
epoch [23/50] batch [80/2000] time 2.014 (2.055) data 0.000 (0.009) loss 1.4179 (1.1568) lr 1.4818e-03 eta 1 day, 7:55:00
epoch [23/50] batch [100/2000] time 2.069 (2.055) data 0.000 (0.007) loss 2.1594 (1.1975) lr 1.4818e-03 eta 1 day, 7:54:39
epoch [23/50] batch [120/2000] time 2.069 (2.055) data 0.000 (0.006) loss 0.5889 (1.1391) lr 1.4818e-03 eta 1 day, 7:53:38
epoch [23/50] batch [140/2000] time 2.068 (2.054) data 0.000 (0.005) loss 1.4158 (1.1495) lr 1.4818e-03 eta 1 day, 7:52:09
epoch [23/50] batch [160/2000] time 2.055 (2.054) data 0.000 (0.005) loss 0.7503 (1.1477) lr 1.4818e-03 eta 1 day, 7:51:11
epoch [23/50] batch [180/2000] time 2.066 (2.053) data 0.000 (0.004) loss 0.1071 (1.1873) lr 1.4818e-03 eta 1 day, 7:50:08
epoch [23/50] batch [200/2000] time 2.081 (2.053) data 0.000 (0.004) loss 0.8695 (1.1963) lr 1.4818e-03 eta 1 day, 7:49:29
epoch [23/50] batch [220/2000] time 2.009 (2.052) data 0.000 (0.004) loss 0.7359 (1.2072) lr 1.4818e-03 eta 1 day, 7:48:06
epoch [23/50] batch [240/2000] time 2.073 (2.052) data 0.000 (0.004) loss 0.5990 (1.2211) lr 1.4818e-03 eta 1 day, 7:47:05
epoch [23/50] batch [260/2000] time 2.091 (2.052) data 0.001 (0.003) loss 0.4142 (1.2192) lr 1.4818e-03 eta 1 day, 7:46:13
epoch [23/50] batch [280/2000] time 2.074 (2.051) data 0.000 (0.003) loss 3.0931 (1.2331) lr 1.4818e-03 eta 1 day, 7:45:07
epoch [23/50] batch [300/2000] time 2.070 (2.052) data 0.000 (0.003) loss 1.0620 (1.2062) lr 1.4818e-03 eta 1 day, 7:44:44
epoch [23/50] batch [320/2000] time 1.989 (2.051) data 0.000 (0.003) loss 0.6552 (1.2206) lr 1.4818e-03 eta 1 day, 7:43:27
epoch [23/50] batch [340/2000] time 2.080 (2.051) data 0.000 (0.003) loss 1.1419 (1.2216) lr 1.4818e-03 eta 1 day, 7:42:28
epoch [23/50] batch [360/2000] time 2.044 (2.051) data 0.000 (0.002) loss 0.3866 (1.2062) lr 1.4818e-03 eta 1 day, 7:41:30
epoch [23/50] batch [380/2000] time 2.070 (2.050) data 0.000 (0.002) loss 0.1393 (1.2088) lr 1.4818e-03 eta 1 day, 7:40:44
epoch [23/50] batch [400/2000] time 2.072 (2.050) data 0.000 (0.002) loss 1.5803 (1.2056) lr 1.4818e-03 eta 1 day, 7:39:47
epoch [23/50] batch [420/2000] time 2.016 (2.050) data 0.000 (0.002) loss 1.4607 (1.1987) lr 1.4818e-03 eta 1 day, 7:38:51
epoch [23/50] batch [440/2000] time 2.075 (2.050) data 0.000 (0.002) loss 0.2458 (1.2062) lr 1.4818e-03 eta 1 day, 7:38:39
epoch [23/50] batch [460/2000] time 2.089 (2.051) data 0.000 (0.002) loss 1.1288 (1.2069) lr 1.4818e-03 eta 1 day, 7:38:51
epoch [23/50] batch [480/2000] time 2.069 (2.052) data 0.000 (0.002) loss 2.4938 (1.2005) lr 1.4818e-03 eta 1 day, 7:38:20
epoch [23/50] batch [500/2000] time 2.046 (2.051) data 0.000 (0.002) loss 1.1775 (1.1992) lr 1.4818e-03 eta 1 day, 7:37:37
epoch [23/50] batch [520/2000] time 2.419 (2.054) data 0.000 (0.002) loss 0.8082 (1.2016) lr 1.4818e-03 eta 1 day, 7:39:29
epoch [23/50] batch [540/2000] time 1.990 (2.062) data 0.000 (0.002) loss 1.3897 (1.1984) lr 1.4818e-03 eta 1 day, 7:46:14
epoch [23/50] batch [560/2000] time 2.040 (2.062) data 0.000 (0.002) loss 0.9632 (1.2076) lr 1.4818e-03 eta 1 day, 7:45:04
epoch [23/50] batch [580/2000] time 2.043 (2.061) data 0.000 (0.002) loss 0.0896 (1.1995) lr 1.4818e-03 eta 1 day, 7:43:40
epoch [23/50] batch [600/2000] time 2.012 (2.061) data 0.001 (0.002) loss 1.1721 (1.1953) lr 1.4818e-03 eta 1 day, 7:42:42
epoch [23/50] batch [620/2000] time 1.985 (2.060) data 0.000 (0.002) loss 0.3084 (1.1936) lr 1.4818e-03 eta 1 day, 7:41:10
epoch [23/50] batch [640/2000] time 2.008 (2.059) data 0.000 (0.002) loss 2.1440 (1.1875) lr 1.4818e-03 eta 1 day, 7:40:06
epoch [23/50] batch [660/2000] time 2.046 (2.059) data 0.000 (0.002) loss 1.6942 (1.2036) lr 1.4818e-03 eta 1 day, 7:38:51
epoch [23/50] batch [680/2000] time 2.022 (2.058) data 0.000 (0.001) loss 0.8007 (1.2014) lr 1.4818e-03 eta 1 day, 7:37:50
epoch [23/50] batch [700/2000] time 2.066 (2.058) data 0.000 (0.002) loss 0.8694 (1.1970) lr 1.4818e-03 eta 1 day, 7:36:56
epoch [23/50] batch [720/2000] time 2.043 (2.058) data 0.000 (0.002) loss 0.0456 (1.1844) lr 1.4818e-03 eta 1 day, 7:36:02
epoch [23/50] batch [740/2000] time 2.020 (2.058) data 0.000 (0.001) loss 0.2436 (1.1765) lr 1.4818e-03 eta 1 day, 7:35:09
epoch [23/50] batch [760/2000] time 2.047 (2.057) data 0.000 (0.001) loss 2.6809 (1.1703) lr 1.4818e-03 eta 1 day, 7:34:12
epoch [23/50] batch [780/2000] time 2.162 (2.059) data 0.000 (0.001) loss 0.5487 (1.1672) lr 1.4818e-03 eta 1 day, 7:34:31
epoch [23/50] batch [800/2000] time 2.436 (2.068) data 0.000 (0.001) loss 1.3005 (1.1640) lr 1.4818e-03 eta 1 day, 7:42:12
epoch [23/50] batch [820/2000] time 2.142 (2.070) data 0.000 (0.001) loss 2.2121 (1.1644) lr 1.4818e-03 eta 1 day, 7:43:44
epoch [23/50] batch [840/2000] time 2.065 (2.070) data 0.000 (0.001) loss 1.4674 (1.1625) lr 1.4818e-03 eta 1 day, 7:43:02
epoch [23/50] batch [860/2000] time 2.071 (2.070) data 0.000 (0.001) loss 2.3000 (1.1667) lr 1.4818e-03 eta 1 day, 7:41:55
epoch [23/50] batch [880/2000] time 2.012 (2.069) data 0.000 (0.001) loss 0.1586 (1.1654) lr 1.4818e-03 eta 1 day, 7:41:04
epoch [23/50] batch [900/2000] time 2.070 (2.069) data 0.000 (0.001) loss 4.1546 (1.1670) lr 1.4818e-03 eta 1 day, 7:40:02
epoch [23/50] batch [920/2000] time 2.073 (2.069) data 0.000 (0.001) loss 0.5185 (1.1684) lr 1.4818e-03 eta 1 day, 7:39:09
epoch [23/50] batch [940/2000] time 2.389 (2.075) data 0.000 (0.001) loss 1.0588 (1.1706) lr 1.4818e-03 eta 1 day, 7:44:09
epoch [23/50] batch [960/2000] time 2.145 (2.078) data 0.000 (0.001) loss 0.2626 (1.1694) lr 1.4818e-03 eta 1 day, 7:46:32
epoch [23/50] batch [980/2000] time 2.169 (2.080) data 0.000 (0.001) loss 2.5624 (1.1665) lr 1.4818e-03 eta 1 day, 7:47:26
epoch [23/50] batch [1000/2000] time 2.440 (2.085) data 0.000 (0.001) loss 0.5914 (1.1658) lr 1.4818e-03 eta 1 day, 7:51:32
epoch [23/50] batch [1020/2000] time 2.133 (2.089) data 0.000 (0.001) loss 0.2522 (1.1683) lr 1.4818e-03 eta 1 day, 7:54:38
epoch [23/50] batch [1040/2000] time 2.138 (2.091) data 0.000 (0.001) loss 0.6610 (1.1722) lr 1.4818e-03 eta 1 day, 7:55:02
epoch [23/50] batch [1060/2000] time 2.367 (2.095) data 0.000 (0.001) loss 0.7201 (1.1747) lr 1.4818e-03 eta 1 day, 7:58:24
epoch [23/50] batch [1080/2000] time 2.185 (2.099) data 0.000 (0.001) loss 2.7149 (1.1765) lr 1.4818e-03 eta 1 day, 8:01:02
epoch [23/50] batch [1100/2000] time 2.102 (2.100) data 0.000 (0.001) loss 1.5929 (1.1763) lr 1.4818e-03 eta 1 day, 8:01:19
epoch [23/50] batch [1120/2000] time 2.386 (2.104) data 0.000 (0.001) loss 0.6849 (1.1767) lr 1.4818e-03 eta 1 day, 8:04:09
epoch [23/50] batch [1140/2000] time 2.161 (2.107) data 0.001 (0.001) loss 1.1901 (1.1728) lr 1.4818e-03 eta 1 day, 8:06:46
epoch [23/50] batch [1160/2000] time 2.184 (2.108) data 0.000 (0.001) loss 1.3035 (1.1735) lr 1.4818e-03 eta 1 day, 8:06:47
epoch [23/50] batch [1180/2000] time 2.451 (2.111) data 0.000 (0.001) loss 3.5517 (1.1804) lr 1.4818e-03 eta 1 day, 8:08:57
epoch [23/50] batch [1200/2000] time 2.128 (2.115) data 0.000 (0.001) loss 1.8572 (1.1795) lr 1.4818e-03 eta 1 day, 8:11:23
epoch [23/50] batch [1220/2000] time 2.182 (2.115) data 0.000 (0.001) loss 1.4599 (1.1738) lr 1.4818e-03 eta 1 day, 8:11:13
epoch [23/50] batch [1240/2000] time 2.422 (2.118) data 0.005 (0.001) loss 0.8565 (1.1682) lr 1.4818e-03 eta 1 day, 8:12:42
epoch [23/50] batch [1260/2000] time 2.194 (2.121) data 0.000 (0.001) loss 4.7435 (1.1741) lr 1.4818e-03 eta 1 day, 8:15:30
epoch [23/50] batch [1280/2000] time 2.182 (2.122) data 0.000 (0.001) loss 0.1807 (1.1729) lr 1.4818e-03 eta 1 day, 8:15:24
epoch [23/50] batch [1300/2000] time 2.386 (2.124) data 0.000 (0.001) loss 1.5882 (1.1753) lr 1.4818e-03 eta 1 day, 8:16:28
epoch [23/50] batch [1320/2000] time 2.125 (2.128) data 0.000 (0.001) loss 2.6165 (1.1734) lr 1.4818e-03 eta 1 day, 8:19:07
epoch [23/50] batch [1340/2000] time 2.123 (2.128) data 0.000 (0.001) loss 3.1403 (1.1761) lr 1.4818e-03 eta 1 day, 8:18:42
epoch [23/50] batch [1360/2000] time 2.463 (2.130) data 0.000 (0.001) loss 0.8024 (1.1775) lr 1.4818e-03 eta 1 day, 8:19:27
epoch [23/50] batch [1380/2000] time 2.175 (2.133) data 0.000 (0.001) loss 0.7482 (1.1787) lr 1.4818e-03 eta 1 day, 8:22:04
epoch [23/50] batch [1400/2000] time 2.155 (2.134) data 0.000 (0.001) loss 1.9476 (1.1769) lr 1.4818e-03 eta 1 day, 8:21:40
epoch [23/50] batch [1420/2000] time 2.511 (2.135) data 0.000 (0.001) loss 0.4447 (1.1720) lr 1.4818e-03 eta 1 day, 8:21:45
epoch [23/50] batch [1440/2000] time 2.444 (2.139) data 0.000 (0.001) loss 0.2650 (1.1748) lr 1.4818e-03 eta 1 day, 8:24:36
epoch [23/50] batch [1460/2000] time 2.181 (2.139) data 0.000 (0.001) loss 1.7096 (1.1754) lr 1.4818e-03 eta 1 day, 8:24:04
epoch [23/50] batch [1480/2000] time 2.419 (2.139) data 0.000 (0.001) loss 3.7052 (1.1832) lr 1.4818e-03 eta 1 day, 8:23:42
epoch [23/50] batch [1500/2000] time 2.471 (2.143) data 0.000 (0.001) loss 1.2576 (1.1876) lr 1.4818e-03 eta 1 day, 8:26:29
epoch [23/50] batch [1520/2000] time 2.130 (2.143) data 0.000 (0.001) loss 4.2265 (1.1887) lr 1.4818e-03 eta 1 day, 8:26:05
epoch [23/50] batch [1540/2000] time 2.116 (2.143) data 0.000 (0.001) loss 0.1217 (1.1936) lr 1.4818e-03 eta 1 day, 8:25:31
epoch [23/50] batch [1560/2000] time 2.392 (2.147) data 0.003 (0.001) loss 1.3840 (1.1967) lr 1.4818e-03 eta 1 day, 8:27:45
epoch [23/50] batch [1580/2000] time 2.176 (2.148) data 0.001 (0.001) loss 0.2210 (1.1936) lr 1.4818e-03 eta 1 day, 8:27:55
epoch [23/50] batch [1600/2000] time 2.097 (2.148) data 0.000 (0.001) loss 0.5546 (1.1892) lr 1.4818e-03 eta 1 day, 8:27:12
epoch [23/50] batch [1620/2000] time 2.386 (2.150) data 0.000 (0.001) loss 0.8512 (1.1859) lr 1.4818e-03 eta 1 day, 8:29:02
epoch [23/50] batch [1640/2000] time 2.120 (2.152) data 0.000 (0.001) loss 1.9208 (1.1868) lr 1.4818e-03 eta 1 day, 8:29:19
epoch [23/50] batch [1660/2000] time 2.207 (2.152) data 0.000 (0.001) loss 0.9238 (1.1867) lr 1.4818e-03 eta 1 day, 8:28:39
epoch [23/50] batch [1680/2000] time 2.379 (2.154) data 0.001 (0.001) loss 1.0418 (1.1936) lr 1.4818e-03 eta 1 day, 8:30:07
epoch [23/50] batch [1700/2000] time 2.175 (2.155) data 0.000 (0.001) loss 2.4971 (1.1956) lr 1.4818e-03 eta 1 day, 8:30:28
epoch [23/50] batch [1720/2000] time 2.121 (2.155) data 0.000 (0.001) loss 2.6584 (1.1969) lr 1.4818e-03 eta 1 day, 8:29:43
epoch [23/50] batch [1740/2000] time 2.414 (2.157) data 0.000 (0.001) loss 1.2235 (1.1958) lr 1.4818e-03 eta 1 day, 8:30:45
epoch [23/50] batch [1760/2000] time 2.178 (2.159) data 0.000 (0.001) loss 1.0204 (1.1949) lr 1.4818e-03 eta 1 day, 8:31:22
epoch [23/50] batch [1780/2000] time 2.130 (2.159) data 0.000 (0.001) loss 2.2170 (1.1949) lr 1.4818e-03 eta 1 day, 8:30:38
epoch [23/50] batch [1800/2000] time 2.359 (2.161) data 0.000 (0.001) loss 0.8863 (1.1953) lr 1.4818e-03 eta 1 day, 8:31:40
epoch [23/50] batch [1820/2000] time 2.100 (2.162) data 0.000 (0.001) loss 0.2963 (1.1982) lr 1.4818e-03 eta 1 day, 8:32:10
epoch [23/50] batch [1840/2000] time 2.143 (2.162) data 0.000 (0.001) loss 2.7523 (1.1963) lr 1.4818e-03 eta 1 day, 8:31:10
epoch [23/50] batch [1860/2000] time 2.408 (2.162) data 0.000 (0.001) loss 0.7655 (1.1982) lr 1.4818e-03 eta 1 day, 8:30:58
epoch [23/50] batch [1880/2000] time 2.171 (2.164) data 0.000 (0.001) loss 0.9601 (1.1996) lr 1.4818e-03 eta 1 day, 8:32:18
epoch [23/50] batch [1900/2000] time 2.169 (2.164) data 0.000 (0.001) loss 0.0197 (1.1995) lr 1.4818e-03 eta 1 day, 8:31:19
epoch [23/50] batch [1920/2000] time 2.272 (2.164) data 0.000 (0.001) loss 1.8990 (1.2011) lr 1.4818e-03 eta 1 day, 8:30:21
epoch [23/50] batch [1940/2000] time 2.414 (2.166) data 0.000 (0.001) loss 1.0774 (1.2005) lr 1.4818e-03 eta 1 day, 8:31:39
epoch [23/50] batch [1960/2000] time 2.099 (2.166) data 0.000 (0.001) loss 1.7487 (1.2035) lr 1.4818e-03 eta 1 day, 8:31:07
epoch [23/50] batch [1980/2000] time 2.175 (2.166) data 0.000 (0.001) loss 0.4397 (1.2033) lr 1.4818e-03 eta 1 day, 8:30:06
epoch [23/50] batch [2000/2000] time 2.429 (2.167) data 0.000 (0.001) loss 0.2524 (1.2029) lr 1.4258e-03 eta 1 day, 8:30:30
epoch [24/50] batch [20/2000] time 2.068 (2.282) data 0.000 (0.031) loss 0.5904 (1.2795) lr 1.4258e-03 eta 1 day, 10:12:44
epoch [24/50] batch [40/2000] time 2.119 (2.207) data 0.000 (0.016) loss 0.7338 (1.1748) lr 1.4258e-03 eta 1 day, 9:04:31
epoch [24/50] batch [60/2000] time 1.981 (2.183) data 0.001 (0.011) loss 0.8143 (1.2334) lr 1.4258e-03 eta 1 day, 8:42:22
epoch [24/50] batch [80/2000] time 2.061 (2.148) data 0.000 (0.008) loss 2.2370 (1.3385) lr 1.4258e-03 eta 1 day, 8:10:23
epoch [24/50] batch [100/2000] time 2.056 (2.126) data 0.000 (0.006) loss 2.5189 (1.2620) lr 1.4258e-03 eta 1 day, 7:50:15
epoch [24/50] batch [120/2000] time 1.982 (2.111) data 0.000 (0.005) loss 1.2573 (1.2286) lr 1.4258e-03 eta 1 day, 7:35:28
epoch [24/50] batch [140/2000] time 2.033 (2.100) data 0.000 (0.005) loss 1.1246 (1.1998) lr 1.4258e-03 eta 1 day, 7:25:28
epoch [24/50] batch [160/2000] time 2.000 (2.091) data 0.000 (0.004) loss 0.3177 (1.1889) lr 1.4258e-03 eta 1 day, 7:16:09
epoch [24/50] batch [180/2000] time 2.065 (2.084) data 0.000 (0.004) loss 2.3144 (1.2197) lr 1.4258e-03 eta 1 day, 7:09:23
epoch [24/50] batch [200/2000] time 2.067 (2.080) data 0.000 (0.003) loss 2.2436 (1.2291) lr 1.4258e-03 eta 1 day, 7:04:40
epoch [24/50] batch [220/2000] time 2.057 (2.076) data 0.000 (0.003) loss 2.8220 (1.2216) lr 1.4258e-03 eta 1 day, 7:00:46
epoch [24/50] batch [240/2000] time 2.032 (2.073) data 0.000 (0.003) loss 1.1244 (1.2141) lr 1.4258e-03 eta 1 day, 6:57:30
epoch [24/50] batch [260/2000] time 2.493 (2.093) data 0.000 (0.003) loss 1.2172 (1.1913) lr 1.4258e-03 eta 1 day, 7:14:21
epoch [24/50] batch [280/2000] time 2.164 (2.105) data 0.000 (0.003) loss 0.7774 (1.1857) lr 1.4258e-03 eta 1 day, 7:24:19
epoch [24/50] batch [300/2000] time 2.149 (2.107) data 0.000 (0.002) loss 0.4242 (1.1913) lr 1.4258e-03 eta 1 day, 7:26:06
epoch [24/50] batch [320/2000] time 2.361 (2.122) data 0.000 (0.002) loss 1.2993 (1.1734) lr 1.4258e-03 eta 1 day, 7:38:20
epoch [24/50] batch [340/2000] time 2.147 (2.130) data 0.000 (0.002) loss 0.6040 (1.1604) lr 1.4258e-03 eta 1 day, 7:44:32
epoch [24/50] batch [360/2000] time 2.142 (2.130) data 0.000 (0.002) loss 1.9822 (1.1692) lr 1.4258e-03 eta 1 day, 7:44:30
epoch [24/50] batch [380/2000] time 2.426 (2.141) data 0.000 (0.002) loss 0.7293 (1.1707) lr 1.4258e-03 eta 1 day, 7:52:54
epoch [24/50] batch [400/2000] time 2.146 (2.147) data 0.000 (0.002) loss 2.1191 (1.1700) lr 1.4258e-03 eta 1 day, 7:57:54
epoch [24/50] batch [420/2000] time 2.180 (2.146) data 0.000 (0.002) loss 0.0339 (1.1765) lr 1.4258e-03 eta 1 day, 7:56:42
epoch [24/50] batch [440/2000] time 2.432 (2.153) data 0.000 (0.002) loss 1.4093 (1.1867) lr 1.4258e-03 eta 1 day, 8:02:08
epoch [24/50] batch [460/2000] time 2.097 (2.159) data 0.000 (0.002) loss 1.0675 (1.2031) lr 1.4258e-03 eta 1 day, 8:06:39
epoch [24/50] batch [480/2000] time 2.166 (2.158) data 0.000 (0.002) loss 1.6528 (1.2065) lr 1.4258e-03 eta 1 day, 8:04:49
epoch [24/50] batch [500/2000] time 2.430 (2.163) data 0.000 (0.002) loss 0.2441 (1.2082) lr 1.4258e-03 eta 1 day, 8:08:28
epoch [24/50] batch [520/2000] time 2.148 (2.169) data 0.000 (0.002) loss 3.4674 (1.2191) lr 1.4258e-03 eta 1 day, 8:13:00
epoch [24/50] batch [540/2000] time 2.171 (2.168) data 0.000 (0.001) loss 1.1198 (1.2154) lr 1.4258e-03 eta 1 day, 8:11:23
epoch [24/50] batch [560/2000] time 2.428 (2.170) data 0.000 (0.001) loss 1.4360 (1.2199) lr 1.4258e-03 eta 1 day, 8:12:22
epoch [24/50] batch [580/2000] time 2.134 (2.177) data 0.000 (0.001) loss 0.4148 (1.2188) lr 1.4258e-03 eta 1 day, 8:18:06
epoch [24/50] batch [600/2000] time 2.119 (2.176) data 0.001 (0.001) loss 0.4795 (1.2152) lr 1.4258e-03 eta 1 day, 8:16:24
epoch [24/50] batch [620/2000] time 2.443 (2.175) data 0.000 (0.001) loss 0.3667 (1.2075) lr 1.4258e-03 eta 1 day, 8:15:05
epoch [24/50] batch [640/2000] time 2.432 (2.182) data 0.000 (0.001) loss 1.3734 (1.2062) lr 1.4258e-03 eta 1 day, 8:20:18
epoch [24/50] batch [660/2000] time 2.149 (2.182) data 0.000 (0.001) loss 0.2510 (1.2051) lr 1.4258e-03 eta 1 day, 8:19:32
epoch [24/50] batch [680/2000] time 2.110 (2.181) data 0.000 (0.001) loss 0.2671 (1.1995) lr 1.4258e-03 eta 1 day, 8:17:53
epoch [24/50] batch [700/2000] time 2.339 (2.185) data 0.000 (0.001) loss 0.4837 (1.2072) lr 1.4258e-03 eta 1 day, 8:21:16
epoch [24/50] batch [720/2000] time 2.127 (2.187) data 0.000 (0.001) loss 0.4413 (1.2189) lr 1.4258e-03 eta 1 day, 8:21:53
epoch [24/50] batch [740/2000] time 2.092 (2.185) data 0.000 (0.001) loss 0.7312 (1.2138) lr 1.4258e-03 eta 1 day, 8:19:52
epoch [24/50] batch [760/2000] time 2.400 (2.188) data 0.000 (0.001) loss 1.8513 (1.2092) lr 1.4258e-03 eta 1 day, 8:21:23
epoch [24/50] batch [780/2000] time 2.166 (2.191) data 0.000 (0.001) loss 0.1049 (1.2073) lr 1.4258e-03 eta 1 day, 8:23:02
epoch [24/50] batch [800/2000] time 2.169 (2.189) data 0.000 (0.001) loss 0.0421 (1.2024) lr 1.4258e-03 eta 1 day, 8:21:03
epoch [24/50] batch [820/2000] time 2.460 (2.190) data 0.000 (0.001) loss 2.6328 (1.2063) lr 1.4258e-03 eta 1 day, 8:21:27
epoch [24/50] batch [840/2000] time 2.155 (2.194) data 0.000 (0.001) loss 0.4986 (1.2009) lr 1.4258e-03 eta 1 day, 8:23:53
epoch [24/50] batch [860/2000] time 2.089 (2.193) data 0.000 (0.001) loss 0.3585 (1.1972) lr 1.4258e-03 eta 1 day, 8:22:05
epoch [24/50] batch [880/2000] time 2.436 (2.193) data 0.000 (0.001) loss 0.4961 (1.1930) lr 1.4258e-03 eta 1 day, 8:21:15
epoch [24/50] batch [900/2000] time 2.155 (2.197) data 0.000 (0.001) loss 0.3395 (1.1934) lr 1.4258e-03 eta 1 day, 8:24:45
epoch [24/50] batch [920/2000] time 2.181 (2.196) data 0.000 (0.001) loss 1.2698 (1.1904) lr 1.4258e-03 eta 1 day, 8:23:09
epoch [24/50] batch [940/2000] time 2.426 (2.196) data 0.000 (0.001) loss 0.0322 (1.1865) lr 1.4258e-03 eta 1 day, 8:21:42
epoch [24/50] batch [960/2000] time 2.419 (2.200) data 0.000 (0.001) loss 2.3548 (1.1888) lr 1.4258e-03 eta 1 day, 8:24:56
epoch [24/50] batch [980/2000] time 2.167 (2.199) data 0.000 (0.001) loss 0.8075 (1.1827) lr 1.4258e-03 eta 1 day, 8:23:29
epoch [24/50] batch [1000/2000] time 2.184 (2.198) data 0.001 (0.001) loss 1.5367 (1.1800) lr 1.4258e-03 eta 1 day, 8:21:53
epoch [24/50] batch [1020/2000] time 2.398 (2.202) data 0.000 (0.001) loss 1.1443 (1.1767) lr 1.4258e-03 eta 1 day, 8:24:41
epoch [24/50] batch [1040/2000] time 2.171 (2.202) data 0.000 (0.001) loss 1.7420 (1.1710) lr 1.4258e-03 eta 1 day, 8:23:38
epoch [24/50] batch [1060/2000] time 2.142 (2.201) data 0.000 (0.001) loss 0.9805 (1.1655) lr 1.4258e-03 eta 1 day, 8:21:52
epoch [24/50] batch [1080/2000] time 2.417 (2.204) data 0.000 (0.001) loss 1.7390 (1.1686) lr 1.4258e-03 eta 1 day, 8:24:10
epoch [24/50] batch [1100/2000] time 2.125 (2.204) data 0.000 (0.001) loss 1.4294 (1.1691) lr 1.4258e-03 eta 1 day, 8:23:25
epoch [24/50] batch [1120/2000] time 2.119 (2.203) data 0.000 (0.001) loss 1.4428 (1.1684) lr 1.4258e-03 eta 1 day, 8:21:45
epoch [24/50] batch [1140/2000] time 2.495 (2.206) data 0.001 (0.001) loss 0.7430 (1.1625) lr 1.4258e-03 eta 1 day, 8:23:54
epoch [24/50] batch [1160/2000] time 2.167 (2.207) data 0.000 (0.001) loss 2.7391 (1.1653) lr 1.4258e-03 eta 1 day, 8:23:13
epoch [24/50] batch [1180/2000] time 2.150 (2.205) data 0.000 (0.001) loss 0.5263 (1.1663) lr 1.4258e-03 eta 1 day, 8:21:23
epoch [24/50] batch [1200/2000] time 2.466 (2.208) data 0.000 (0.001) loss 1.0951 (1.1701) lr 1.4258e-03 eta 1 day, 8:23:22
epoch [24/50] batch [1220/2000] time 2.148 (2.208) data 0.000 (0.001) loss 0.9187 (1.1701) lr 1.4258e-03 eta 1 day, 8:22:41
epoch [24/50] batch [1240/2000] time 2.106 (2.207) data 0.000 (0.001) loss 2.5111 (1.1699) lr 1.4258e-03 eta 1 day, 8:20:58
epoch [24/50] batch [1260/2000] time 2.366 (2.210) data 0.000 (0.001) loss 0.2131 (1.1688) lr 1.4258e-03 eta 1 day, 8:22:27
epoch [24/50] batch [1280/2000] time 2.144 (2.210) data 0.000 (0.001) loss 0.8859 (1.1733) lr 1.4258e-03 eta 1 day, 8:21:48
epoch [24/50] batch [1300/2000] time 2.146 (2.209) data 0.000 (0.001) loss 0.4130 (1.1724) lr 1.4258e-03 eta 1 day, 8:20:11
epoch [24/50] batch [1320/2000] time 2.348 (2.211) data 0.000 (0.001) loss 2.0886 (1.1747) lr 1.4258e-03 eta 1 day, 8:21:35
epoch [24/50] batch [1340/2000] time 2.264 (2.212) data 0.000 (0.001) loss 1.4787 (1.1737) lr 1.4258e-03 eta 1 day, 8:21:32
epoch [24/50] batch [1360/2000] time 2.116 (2.214) data 0.000 (0.001) loss 0.2507 (1.1703) lr 1.4258e-03 eta 1 day, 8:22:35
epoch [24/50] batch [1380/2000] time 2.429 (2.220) data 0.000 (0.001) loss 1.3582 (1.1681) lr 1.4258e-03 eta 1 day, 8:26:57
epoch [24/50] batch [1400/2000] time 2.260 (2.222) data 0.000 (0.001) loss 0.1350 (1.1687) lr 1.4258e-03 eta 1 day, 8:28:12
epoch [24/50] batch [1420/2000] time 2.299 (2.225) data 0.000 (0.001) loss 1.8893 (1.1669) lr 1.4258e-03 eta 1 day, 8:29:47
epoch [24/50] batch [1440/2000] time 2.425 (2.231) data 0.000 (0.001) loss 3.2476 (1.1687) lr 1.4258e-03 eta 1 day, 8:34:46
epoch [24/50] batch [1460/2000] time 2.336 (2.233) data 0.001 (0.001) loss 0.5152 (1.1701) lr 1.4258e-03 eta 1 day, 8:35:10
epoch [24/50] batch [1480/2000] time 2.457 (2.236) data 0.000 (0.001) loss 1.8924 (1.1720) lr 1.4258e-03 eta 1 day, 8:37:26
epoch [24/50] batch [1500/2000] time 3.098 (2.242) data 0.000 (0.001) loss 0.6396 (1.1678) lr 1.4258e-03 eta 1 day, 8:41:21
epoch [24/50] batch [1520/2000] time 2.411 (2.244) data 0.000 (0.001) loss 0.7220 (1.1689) lr 1.4258e-03 eta 1 day, 8:42:29
epoch [24/50] batch [1540/2000] time 2.431 (2.247) data 0.000 (0.001) loss 0.8807 (1.1673) lr 1.4258e-03 eta 1 day, 8:44:15
epoch [24/50] batch [1560/2000] time 2.384 (2.249) data 0.000 (0.001) loss 0.5979 (1.1639) lr 1.4258e-03 eta 1 day, 8:46:02
epoch [24/50] batch [1580/2000] time 2.422 (2.250) data 0.000 (0.001) loss 0.2098 (1.1596) lr 1.4258e-03 eta 1 day, 8:46:10
epoch [24/50] batch [1600/2000] time 2.434 (2.254) data 0.000 (0.001) loss 0.2101 (1.1573) lr 1.4258e-03 eta 1 day, 8:48:15
epoch [24/50] batch [1620/2000] time 2.109 (2.257) data 0.000 (0.001) loss 0.1774 (1.1568) lr 1.4258e-03 eta 1 day, 8:49:56
epoch [24/50] batch [1640/2000] time 2.246 (2.257) data 0.000 (0.001) loss 0.9500 (1.1575) lr 1.4258e-03 eta 1 day, 8:49:37
epoch [24/50] batch [1660/2000] time 2.601 (2.260) data 0.000 (0.001) loss 0.1191 (1.1543) lr 1.4258e-03 eta 1 day, 8:51:42
epoch [24/50] batch [1680/2000] time 2.151 (2.262) data 0.001 (0.001) loss 1.0659 (1.1508) lr 1.4258e-03 eta 1 day, 8:52:35
epoch [24/50] batch [1700/2000] time 2.365 (2.263) data 0.000 (0.001) loss 1.7999 (1.1513) lr 1.4258e-03 eta 1 day, 8:52:10
epoch [24/50] batch [1720/2000] time 2.312 (2.266) data 0.000 (0.001) loss 1.2085 (1.1537) lr 1.4258e-03 eta 1 day, 8:54:08
epoch [24/50] batch [1740/2000] time 2.134 (2.267) data 0.000 (0.001) loss 3.4976 (1.1557) lr 1.4258e-03 eta 1 day, 8:54:30
epoch [24/50] batch [1760/2000] time 3.095 (2.268) data 0.000 (0.001) loss 1.8488 (1.1548) lr 1.4258e-03 eta 1 day, 8:54:40
epoch [24/50] batch [1780/2000] time 2.671 (2.271) data 0.000 (0.001) loss 1.0672 (1.1581) lr 1.4258e-03 eta 1 day, 8:56:46
epoch [24/50] batch [1800/2000] time 2.168 (2.272) data 0.000 (0.001) loss 0.8155 (1.1576) lr 1.4258e-03 eta 1 day, 8:56:59
epoch [24/50] batch [1820/2000] time 3.299 (2.274) data 0.000 (0.001) loss 1.1440 (1.1585) lr 1.4258e-03 eta 1 day, 8:57:29
epoch [24/50] batch [1840/2000] time 2.654 (2.277) data 0.000 (0.001) loss 1.1309 (1.1576) lr 1.4258e-03 eta 1 day, 8:59:23
epoch [24/50] batch [1860/2000] time 2.108 (2.278) data 0.000 (0.001) loss 0.0479 (1.1600) lr 1.4258e-03 eta 1 day, 8:59:18
epoch [24/50] batch [1880/2000] time 2.463 (2.279) data 0.000 (0.001) loss 0.6079 (1.1596) lr 1.4258e-03 eta 1 day, 8:59:40
epoch [24/50] batch [1900/2000] time 2.370 (2.282) data 0.000 (0.001) loss 0.7650 (1.1643) lr 1.4258e-03 eta 1 day, 9:01:20
epoch [24/50] batch [1920/2000] time 2.269 (2.282) data 0.000 (0.001) loss 1.1932 (1.1636) lr 1.4258e-03 eta 1 day, 9:00:46
epoch [24/50] batch [1940/2000] time 2.403 (2.283) data 0.000 (0.001) loss 1.7143 (1.1638) lr 1.4258e-03 eta 1 day, 9:00:50
epoch [24/50] batch [1960/2000] time 2.101 (2.286) data 0.000 (0.001) loss 0.6939 (1.1627) lr 1.4258e-03 eta 1 day, 9:02:18
epoch [24/50] batch [1980/2000] time 2.352 (2.285) data 0.000 (0.001) loss 2.3484 (1.1617) lr 1.4258e-03 eta 1 day, 9:01:17
epoch [24/50] batch [2000/2000] time 2.372 (2.286) data 0.000 (0.001) loss 1.9069 (1.1609) lr 1.3681e-03 eta 1 day, 9:01:36
epoch [25/50] batch [20/2000] time 2.349 (2.462) data 0.000 (0.037) loss 0.9646 (0.9741) lr 1.3681e-03 eta 1 day, 11:32:52
epoch [25/50] batch [40/2000] time 2.296 (2.368) data 0.000 (0.019) loss 0.2544 (1.1231) lr 1.3681e-03 eta 1 day, 10:10:44
epoch [25/50] batch [60/2000] time 3.102 (2.462) data 0.001 (0.013) loss 0.1987 (1.1410) lr 1.3681e-03 eta 1 day, 11:31:08
epoch [25/50] batch [80/2000] time 2.115 (2.521) data 0.000 (0.010) loss 1.1243 (1.0852) lr 1.3681e-03 eta 1 day, 12:21:41
epoch [25/50] batch [100/2000] time 2.116 (2.510) data 0.000 (0.008) loss 0.1474 (1.0507) lr 1.3681e-03 eta 1 day, 12:10:52
epoch [25/50] batch [120/2000] time 3.698 (2.576) data 0.000 (0.007) loss 0.0609 (1.0365) lr 1.3681e-03 eta 1 day, 13:07:01
epoch [25/50] batch [140/2000] time 2.185 (2.572) data 0.000 (0.006) loss 2.2075 (1.0954) lr 1.3681e-03 eta 1 day, 13:02:52
epoch [25/50] batch [160/2000] time 2.413 (2.568) data 0.007 (0.005) loss 0.0079 (1.1063) lr 1.3681e-03 eta 1 day, 12:58:50
epoch [25/50] batch [180/2000] time 3.494 (2.600) data 0.000 (0.005) loss 1.1386 (1.0805) lr 1.3681e-03 eta 1 day, 13:25:44
epoch [25/50] batch [200/2000] time 2.091 (2.609) data 0.000 (0.004) loss 0.4840 (1.0811) lr 1.3681e-03 eta 1 day, 13:32:33
epoch [25/50] batch [220/2000] time 2.450 (2.617) data 0.000 (0.004) loss 0.5864 (1.0634) lr 1.3681e-03 eta 1 day, 13:38:39
epoch [25/50] batch [240/2000] time 2.254 (2.621) data 0.001 (0.004) loss 0.2757 (1.0563) lr 1.3681e-03 eta 1 day, 13:41:27
epoch [25/50] batch [260/2000] time 3.456 (2.623) data 0.000 (0.003) loss 1.9279 (1.0824) lr 1.3681e-03 eta 1 day, 13:41:45
epoch [25/50] batch [280/2000] time 2.381 (2.642) data 0.000 (0.003) loss 1.4143 (1.0917) lr 1.3681e-03 eta 1 day, 13:56:59
epoch [25/50] batch [300/2000] time 2.341 (2.627) data 0.000 (0.003) loss 0.2409 (1.1198) lr 1.3681e-03 eta 1 day, 13:43:27
epoch [25/50] batch [320/2000] time 2.395 (2.625) data 0.000 (0.003) loss 0.4009 (1.1141) lr 1.3681e-03 eta 1 day, 13:40:43
epoch [25/50] batch [340/2000] time 2.313 (2.625) data 0.000 (0.003) loss 0.9924 (1.1020) lr 1.3681e-03 eta 1 day, 13:39:51
epoch [25/50] batch [360/2000] time 2.175 (2.622) data 0.001 (0.003) loss 2.8023 (1.0878) lr 1.3681e-03 eta 1 day, 13:36:18
epoch [25/50] batch [380/2000] time 2.557 (2.613) data 0.000 (0.002) loss 1.2618 (1.0828) lr 1.3681e-03 eta 1 day, 13:28:11
epoch [25/50] batch [400/2000] time 2.237 (2.616) data 0.000 (0.002) loss 1.9941 (1.0992) lr 1.3681e-03 eta 1 day, 13:29:29
epoch [25/50] batch [420/2000] time 3.188 (2.612) data 0.000 (0.002) loss 1.1568 (1.1197) lr 1.3681e-03 eta 1 day, 13:25:26
epoch [25/50] batch [440/2000] time 2.387 (2.607) data 0.000 (0.002) loss 0.3843 (1.1273) lr 1.3681e-03 eta 1 day, 13:19:52
epoch [25/50] batch [460/2000] time 2.198 (2.608) data 0.000 (0.002) loss 3.1101 (1.1296) lr 1.3681e-03 eta 1 day, 13:20:21
epoch [25/50] batch [480/2000] time 2.255 (2.599) data 0.000 (0.002) loss 0.1009 (1.1305) lr 1.3681e-03 eta 1 day, 13:12:04
epoch [25/50] batch [500/2000] time 2.518 (2.592) data 0.000 (0.002) loss 1.4353 (1.1319) lr 1.3681e-03 eta 1 day, 13:04:23
epoch [25/50] batch [520/2000] time 2.517 (2.595) data 0.000 (0.002) loss 0.6546 (1.1383) lr 1.3681e-03 eta 1 day, 13:06:07
epoch [25/50] batch [540/2000] time 2.312 (2.585) data 0.000 (0.002) loss 2.0550 (1.1492) lr 1.3681e-03 eta 1 day, 12:57:04
epoch [25/50] batch [560/2000] time 2.186 (2.576) data 0.000 (0.002) loss 0.2631 (1.1392) lr 1.3681e-03 eta 1 day, 12:48:14
epoch [25/50] batch [580/2000] time 2.355 (2.575) data 0.015 (0.002) loss 0.7999 (1.1474) lr 1.3681e-03 eta 1 day, 12:47:09
epoch [25/50] batch [600/2000] time 2.240 (2.570) data 0.001 (0.002) loss 2.4570 (1.1436) lr 1.3681e-03 eta 1 day, 12:41:30
epoch [25/50] batch [620/2000] time 2.279 (2.563) data 0.000 (0.002) loss 0.6081 (1.1444) lr 1.3681e-03 eta 1 day, 12:34:33
epoch [25/50] batch [640/2000] time 2.443 (2.560) data 0.000 (0.002) loss 0.4785 (1.1435) lr 1.3681e-03 eta 1 day, 12:31:40
epoch [25/50] batch [660/2000] time 2.912 (2.560) data 0.000 (0.002) loss 0.6911 (1.1345) lr 1.3681e-03 eta 1 day, 12:30:38
epoch [25/50] batch [680/2000] time 2.909 (2.555) data 0.000 (0.002) loss 2.8861 (1.1349) lr 1.3681e-03 eta 1 day, 12:25:28
epoch [25/50] batch [700/2000] time 3.150 (2.554) data 0.000 (0.002) loss 0.6160 (1.1340) lr 1.3681e-03 eta 1 day, 12:23:40
epoch [25/50] batch [720/2000] time 2.992 (2.555) data 0.000 (0.002) loss 2.3881 (1.1352) lr 1.3681e-03 eta 1 day, 12:23:48
epoch [25/50] batch [740/2000] time 2.915 (2.550) data 0.000 (0.002) loss 0.6215 (1.1342) lr 1.3681e-03 eta 1 day, 12:18:15
epoch [25/50] batch [760/2000] time 3.294 (2.549) data 0.000 (0.002) loss 0.9091 (1.1361) lr 1.3681e-03 eta 1 day, 12:16:52
epoch [25/50] batch [780/2000] time 2.079 (2.549) data 0.000 (0.001) loss 0.2713 (1.1357) lr 1.3681e-03 eta 1 day, 12:15:36
epoch [25/50] batch [800/2000] time 2.133 (2.542) data 0.000 (0.001) loss 1.0571 (1.1420) lr 1.3681e-03 eta 1 day, 12:09:18
epoch [25/50] batch [820/2000] time 2.372 (2.538) data 0.000 (0.001) loss 0.9054 (1.1399) lr 1.3681e-03 eta 1 day, 12:04:44
epoch [25/50] batch [840/2000] time 2.546 (2.538) data 0.000 (0.001) loss 2.9533 (1.1444) lr 1.3681e-03 eta 1 day, 12:04:09
epoch [25/50] batch [860/2000] time 2.281 (2.533) data 0.000 (0.001) loss 0.2524 (1.1612) lr 1.3681e-03 eta 1 day, 11:58:39
epoch [25/50] batch [880/2000] time 2.990 (2.529) data 0.000 (0.001) loss 1.4218 (1.1609) lr 1.3681e-03 eta 1 day, 11:54:47
epoch [25/50] batch [900/2000] time 2.363 (2.530) data 0.000 (0.001) loss 0.8135 (1.1677) lr 1.3681e-03 eta 1 day, 11:54:35
epoch [25/50] batch [920/2000] time 2.444 (2.526) data 0.000 (0.001) loss 0.3593 (1.1641) lr 1.3681e-03 eta 1 day, 11:50:34
epoch [25/50] batch [940/2000] time 2.094 (2.521) data 0.000 (0.001) loss 1.2787 (1.1732) lr 1.3681e-03 eta 1 day, 11:45:28
epoch [25/50] batch [960/2000] time 2.529 (2.521) data 0.000 (0.001) loss 0.3337 (1.1785) lr 1.3681e-03 eta 1 day, 11:44:15
epoch [25/50] batch [980/2000] time 2.260 (2.518) data 0.000 (0.001) loss 1.0519 (1.1732) lr 1.3681e-03 eta 1 day, 11:41:00
epoch [25/50] batch [1000/2000] time 2.663 (2.514) data 0.000 (0.001) loss 0.3140 (1.1689) lr 1.3681e-03 eta 1 day, 11:36:48
epoch [25/50] batch [1020/2000] time 2.656 (2.514) data 0.000 (0.001) loss 0.2198 (1.1684) lr 1.3681e-03 eta 1 day, 11:35:43
epoch [25/50] batch [1040/2000] time 2.871 (2.515) data 0.000 (0.001) loss 2.5272 (1.1689) lr 1.3681e-03 eta 1 day, 11:35:55
epoch [25/50] batch [1060/2000] time 2.956 (2.523) data 0.000 (0.001) loss 4.0409 (1.1803) lr 1.3681e-03 eta 1 day, 11:41:41
epoch [25/50] batch [1080/2000] time 3.294 (2.524) data 0.000 (0.001) loss 0.2614 (1.1751) lr 1.3681e-03 eta 1 day, 11:42:04
epoch [25/50] batch [1100/2000] time 2.879 (2.534) data 0.000 (0.001) loss 0.3366 (1.1803) lr 1.3681e-03 eta 1 day, 11:49:29
epoch [25/50] batch [1120/2000] time 2.279 (2.531) data 0.000 (0.001) loss 1.3812 (1.1757) lr 1.3681e-03 eta 1 day, 11:45:53
epoch [25/50] batch [1140/2000] time 3.328 (2.543) data 0.001 (0.001) loss 0.2737 (1.1683) lr 1.3681e-03 eta 1 day, 11:55:44
epoch [25/50] batch [1160/2000] time 2.235 (2.542) data 0.000 (0.001) loss 0.8652 (1.1635) lr 1.3681e-03 eta 1 day, 11:53:49
epoch [25/50] batch [1180/2000] time 3.269 (2.547) data 0.000 (0.001) loss 0.8104 (1.1713) lr 1.3681e-03 eta 1 day, 11:57:31
epoch [25/50] batch [1200/2000] time 2.316 (2.555) data 0.000 (0.001) loss 1.8603 (1.1671) lr 1.3681e-03 eta 1 day, 12:03:08
epoch [25/50] batch [1220/2000] time 2.819 (2.556) data 0.000 (0.001) loss 0.1812 (1.1667) lr 1.3681e-03 eta 1 day, 12:02:50
epoch [25/50] batch [1240/2000] time 2.785 (2.561) data 0.000 (0.001) loss 0.3511 (1.1690) lr 1.3681e-03 eta 1 day, 12:06:22
epoch [25/50] batch [1260/2000] time 2.802 (2.556) data 0.000 (0.001) loss 0.8913 (1.1726) lr 1.3681e-03 eta 1 day, 12:01:26
epoch [25/50] batch [1280/2000] time 2.770 (2.559) data 0.000 (0.001) loss 1.7439 (1.1711) lr 1.3681e-03 eta 1 day, 12:03:24
epoch [25/50] batch [1300/2000] time 2.058 (2.558) data 0.000 (0.001) loss 3.7109 (1.1711) lr 1.3681e-03 eta 1 day, 12:01:43
epoch [25/50] batch [1320/2000] time 2.725 (2.558) data 0.000 (0.001) loss 1.9243 (1.1740) lr 1.3681e-03 eta 1 day, 12:00:36
epoch [25/50] batch [1340/2000] time 2.800 (2.561) data 0.000 (0.001) loss 1.2589 (1.1730) lr 1.3681e-03 eta 1 day, 12:02:35
epoch [25/50] batch [1360/2000] time 2.173 (2.558) data 0.016 (0.001) loss 0.1891 (1.1763) lr 1.3681e-03 eta 1 day, 11:58:53
epoch [25/50] batch [1380/2000] time 2.816 (2.560) data 0.000 (0.001) loss 0.3914 (1.1751) lr 1.3681e-03 eta 1 day, 12:00:03
epoch [25/50] batch [1400/2000] time 2.754 (2.564) data 0.000 (0.001) loss 1.4385 (1.1758) lr 1.3681e-03 eta 1 day, 12:01:53
epoch [25/50] batch [1420/2000] time 2.803 (2.559) data 0.000 (0.001) loss 0.3564 (1.1690) lr 1.3681e-03 eta 1 day, 11:57:20
epoch [25/50] batch [1440/2000] time 2.791 (2.562) data 0.000 (0.001) loss 1.9205 (1.1686) lr 1.3681e-03 eta 1 day, 11:58:50
epoch [25/50] batch [1460/2000] time 2.046 (2.563) data 0.000 (0.001) loss 0.2041 (1.1723) lr 1.3681e-03 eta 1 day, 11:58:41
epoch [25/50] batch [1480/2000] time 2.867 (2.561) data 0.000 (0.001) loss 1.7964 (1.1718) lr 1.3681e-03 eta 1 day, 11:56:40
epoch [25/50] batch [1500/2000] time 2.763 (2.564) data 0.000 (0.001) loss 0.2644 (1.1741) lr 1.3681e-03 eta 1 day, 11:58:02
epoch [25/50] batch [1520/2000] time 2.321 (2.564) data 0.000 (0.001) loss 0.4387 (1.1810) lr 1.3681e-03 eta 1 day, 11:56:48
epoch [25/50] batch [1540/2000] time 2.755 (2.562) data 0.000 (0.001) loss 1.9396 (1.1795) lr 1.3681e-03 eta 1 day, 11:54:54
epoch [25/50] batch [1560/2000] time 2.725 (2.565) data 0.013 (0.001) loss 0.3425 (1.1775) lr 1.3681e-03 eta 1 day, 11:55:56
epoch [25/50] batch [1580/2000] time 2.069 (2.564) data 0.000 (0.001) loss 1.1602 (1.1790) lr 1.3681e-03 eta 1 day, 11:54:54
epoch [25/50] batch [1600/2000] time 2.669 (2.563) data 0.000 (0.001) loss 2.2061 (1.1830) lr 1.3681e-03 eta 1 day, 11:52:34
epoch [25/50] batch [1620/2000] time 2.728 (2.565) data 0.000 (0.001) loss 2.3097 (1.1852) lr 1.3681e-03 eta 1 day, 11:53:41
epoch [25/50] batch [1640/2000] time 2.073 (2.565) data 0.000 (0.001) loss 1.3159 (1.1855) lr 1.3681e-03 eta 1 day, 11:53:15
epoch [25/50] batch [1660/2000] time 2.716 (2.563) data 0.000 (0.001) loss 0.5595 (1.1877) lr 1.3681e-03 eta 1 day, 11:50:44
epoch [25/50] batch [1680/2000] time 2.782 (2.566) data 0.001 (0.001) loss 0.6407 (1.1858) lr 1.3681e-03 eta 1 day, 11:51:47
epoch [25/50] batch [1700/2000] time 2.704 (2.568) data 0.000 (0.001) loss 1.7877 (1.1837) lr 1.3681e-03 eta 1 day, 11:52:33
epoch [25/50] batch [1720/2000] time 2.725 (2.564) data 0.000 (0.001) loss 0.9690 (1.1914) lr 1.3681e-03 eta 1 day, 11:48:39
epoch [25/50] batch [1740/2000] time 2.660 (2.566) data 0.000 (0.001) loss 0.9490 (1.1905) lr 1.3681e-03 eta 1 day, 11:49:22
epoch [25/50] batch [1760/2000] time 2.706 (2.568) data 0.000 (0.001) loss 0.9976 (1.1900) lr 1.3681e-03 eta 1 day, 11:50:15
epoch [25/50] batch [1780/2000] time 2.136 (2.566) data 0.000 (0.001) loss 1.8571 (1.1910) lr 1.3681e-03 eta 1 day, 11:47:20
epoch [25/50] batch [1800/2000] time 2.803 (2.566) data 0.000 (0.001) loss 0.6509 (1.1915) lr 1.3681e-03 eta 1 day, 11:47:10
epoch [25/50] batch [1820/2000] time 2.756 (2.568) data 0.000 (0.001) loss 3.3331 (1.1954) lr 1.3681e-03 eta 1 day, 11:48:02
epoch [25/50] batch [1840/2000] time 2.284 (2.568) data 0.000 (0.001) loss 0.3137 (1.1947) lr 1.3681e-03 eta 1 day, 11:46:47
epoch [25/50] batch [1860/2000] time 2.814 (2.567) data 0.000 (0.001) loss 0.2539 (1.1898) lr 1.3681e-03 eta 1 day, 11:44:58
epoch [25/50] batch [1880/2000] time 2.031 (2.566) data 0.000 (0.001) loss 0.2994 (1.1873) lr 1.3681e-03 eta 1 day, 11:43:34
epoch [25/50] batch [1900/2000] time 2.650 (2.565) data 0.000 (0.001) loss 0.7663 (1.1876) lr 1.3681e-03 eta 1 day, 11:41:41
epoch [25/50] batch [1920/2000] time 2.068 (2.565) data 0.000 (0.001) loss 1.1366 (1.1877) lr 1.3681e-03 eta 1 day, 11:40:38
epoch [25/50] batch [1940/2000] time 2.748 (2.563) data 0.000 (0.001) loss 1.4725 (1.1848) lr 1.3681e-03 eta 1 day, 11:38:31
epoch [25/50] batch [1960/2000] time 2.018 (2.563) data 0.000 (0.001) loss 2.1657 (1.1904) lr 1.3681e-03 eta 1 day, 11:37:42
epoch [25/50] batch [1980/2000] time 2.764 (2.562) data 0.000 (0.001) loss 1.7697 (1.1918) lr 1.3681e-03 eta 1 day, 11:35:40
epoch [25/50] batch [2000/2000] time 2.019 (2.562) data 0.000 (0.001) loss 1.1206 (1.1922) lr 1.3090e-03 eta 1 day, 11:34:52
epoch [26/50] batch [20/2000] time 2.727 (2.551) data 0.016 (0.053) loss 2.2170 (1.0924) lr 1.3090e-03 eta 1 day, 11:25:09
epoch [26/50] batch [40/2000] time 2.285 (2.517) data 0.000 (0.027) loss 2.3391 (1.2698) lr 1.3090e-03 eta 1 day, 10:55:58
epoch [26/50] batch [60/2000] time 2.773 (2.507) data 0.001 (0.018) loss 1.5571 (1.2749) lr 1.3090e-03 eta 1 day, 10:46:20
epoch [26/50] batch [80/2000] time 2.331 (2.507) data 0.000 (0.014) loss 1.2149 (1.2300) lr 1.3090e-03 eta 1 day, 10:46:00
epoch [26/50] batch [100/2000] time 2.662 (2.498) data 0.000 (0.011) loss 0.7464 (1.2455) lr 1.3090e-03 eta 1 day, 10:37:16
epoch [26/50] batch [120/2000] time 2.201 (2.502) data 0.000 (0.009) loss 0.3380 (1.2102) lr 1.3090e-03 eta 1 day, 10:40:06
epoch [26/50] batch [140/2000] time 2.663 (2.494) data 0.000 (0.008) loss 0.7819 (1.2168) lr 1.3090e-03 eta 1 day, 10:32:46
epoch [26/50] batch [160/2000] time 2.004 (2.500) data 0.000 (0.007) loss 1.4575 (1.1994) lr 1.3090e-03 eta 1 day, 10:36:20
epoch [26/50] batch [180/2000] time 2.687 (2.488) data 0.000 (0.006) loss 1.0211 (1.2017) lr 1.3090e-03 eta 1 day, 10:26:16
epoch [26/50] batch [200/2000] time 2.077 (2.499) data 0.000 (0.006) loss 2.8455 (1.1885) lr 1.3090e-03 eta 1 day, 10:34:11
epoch [26/50] batch [220/2000] time 2.656 (2.489) data 0.000 (0.005) loss 0.2328 (1.1865) lr 1.3090e-03 eta 1 day, 10:24:51
epoch [26/50] batch [240/2000] time 2.060 (2.499) data 0.005 (0.005) loss 1.1763 (1.1986) lr 1.3090e-03 eta 1 day, 10:32:12
epoch [26/50] batch [260/2000] time 2.669 (2.488) data 0.000 (0.005) loss 2.6821 (1.2165) lr 1.3090e-03 eta 1 day, 10:22:37
epoch [26/50] batch [280/2000] time 2.072 (2.499) data 0.000 (0.004) loss 1.7038 (1.2227) lr 1.3090e-03 eta 1 day, 10:30:25
epoch [26/50] batch [300/2000] time 2.751 (2.489) data 0.000 (0.004) loss 0.0343 (1.2109) lr 1.3090e-03 eta 1 day, 10:21:56
epoch [26/50] batch [320/2000] time 2.048 (2.498) data 0.000 (0.004) loss 1.5534 (1.2209) lr 1.3090e-03 eta 1 day, 10:28:26
epoch [26/50] batch [340/2000] time 2.783 (2.488) data 0.000 (0.004) loss 0.1621 (1.2109) lr 1.3090e-03 eta 1 day, 10:19:18
epoch [26/50] batch [360/2000] time 2.080 (2.498) data 0.000 (0.004) loss 0.4637 (1.2035) lr 1.3090e-03 eta 1 day, 10:26:50
epoch [26/50] batch [380/2000] time 2.707 (2.488) data 0.000 (0.003) loss 0.5272 (1.2126) lr 1.3090e-03 eta 1 day, 10:17:41
epoch [26/50] batch [400/2000] time 2.072 (2.498) data 0.000 (0.003) loss 1.0964 (1.2114) lr 1.3090e-03 eta 1 day, 10:25:03
epoch [26/50] batch [420/2000] time 2.686 (2.488) data 0.000 (0.003) loss 0.3551 (1.2004) lr 1.3090e-03 eta 1 day, 10:16:02
epoch [26/50] batch [440/2000] time 2.074 (2.496) data 0.000 (0.003) loss 1.4692 (1.2064) lr 1.3090e-03 eta 1 day, 10:21:41
epoch [26/50] batch [460/2000] time 2.784 (2.485) data 0.000 (0.003) loss 2.1780 (1.2074) lr 1.3090e-03 eta 1 day, 10:12:05
epoch [26/50] batch [480/2000] time 2.883 (2.499) data 0.000 (0.003) loss 0.0875 (1.2018) lr 1.3090e-03 eta 1 day, 10:22:38
epoch [26/50] batch [500/2000] time 2.749 (2.511) data 0.000 (0.003) loss 2.0903 (1.2051) lr 1.3090e-03 eta 1 day, 10:31:53
epoch [26/50] batch [520/2000] time 2.796 (2.524) data 0.000 (0.003) loss 1.4702 (1.2080) lr 1.3090e-03 eta 1 day, 10:41:14
epoch [26/50] batch [540/2000] time 2.165 (2.514) data 0.000 (0.003) loss 2.1508 (1.2145) lr 1.3090e-03 eta 1 day, 10:32:07
epoch [26/50] batch [560/2000] time 2.827 (2.521) data 0.000 (0.003) loss 1.8093 (1.2099) lr 1.3090e-03 eta 1 day, 10:37:16
epoch [26/50] batch [580/2000] time 2.705 (2.531) data 0.000 (0.002) loss 0.7253 (1.2159) lr 1.3090e-03 eta 1 day, 10:44:46
epoch [26/50] batch [600/2000] time 2.742 (2.539) data 0.000 (0.002) loss 2.1322 (1.2213) lr 1.3090e-03 eta 1 day, 10:50:18
epoch [26/50] batch [620/2000] time 2.019 (2.538) data 0.000 (0.002) loss 0.0981 (1.2092) lr 1.3090e-03 eta 1 day, 10:48:55
epoch [26/50] batch [640/2000] time 2.855 (2.536) data 0.000 (0.002) loss 1.8800 (1.2076) lr 1.3090e-03 eta 1 day, 10:46:34
epoch [26/50] batch [660/2000] time 2.814 (2.546) data 0.000 (0.002) loss 1.3264 (1.2027) lr 1.3090e-03 eta 1 day, 10:53:15
epoch [26/50] batch [680/2000] time 2.860 (2.553) data 0.000 (0.002) loss 1.3995 (1.2013) lr 1.3090e-03 eta 1 day, 10:58:55
epoch [26/50] batch [700/2000] time 2.088 (2.560) data 0.000 (0.002) loss 2.2763 (1.1985) lr 1.3090e-03 eta 1 day, 11:03:27
epoch [26/50] batch [720/2000] time 2.768 (2.552) data 0.000 (0.002) loss 0.2071 (1.1966) lr 1.3090e-03 eta 1 day, 10:55:51
epoch [26/50] batch [740/2000] time 2.891 (2.558) data 0.000 (0.002) loss 1.2009 (1.1909) lr 1.3090e-03 eta 1 day, 11:00:23
epoch [26/50] batch [760/2000] time 2.877 (2.565) data 0.000 (0.002) loss 1.4919 (1.2017) lr 1.3090e-03 eta 1 day, 11:05:02
epoch [26/50] batch [780/2000] time 2.746 (2.571) data 0.000 (0.002) loss 0.2785 (1.1969) lr 1.3090e-03 eta 1 day, 11:09:11
epoch [26/50] batch [800/2000] time 2.771 (2.577) data 0.000 (0.002) loss 1.6851 (1.1972) lr 1.3090e-03 eta 1 day, 11:13:00
epoch [26/50] batch [820/2000] time 2.858 (2.568) data 0.000 (0.002) loss 1.7507 (1.1983) lr 1.3090e-03 eta 1 day, 11:04:53
epoch [26/50] batch [840/2000] time 2.786 (2.573) data 0.000 (0.002) loss 0.6027 (1.1921) lr 1.3090e-03 eta 1 day, 11:08:15
epoch [26/50] batch [860/2000] time 2.730 (2.578) data 0.000 (0.002) loss 2.3214 (1.1946) lr 1.3090e-03 eta 1 day, 11:11:15
epoch [26/50] batch [880/2000] time 2.764 (2.582) data 0.000 (0.002) loss 1.4647 (1.1974) lr 1.3090e-03 eta 1 day, 11:14:10
epoch [26/50] batch [900/2000] time 2.816 (2.588) data 0.000 (0.002) loss 0.2490 (1.2005) lr 1.3090e-03 eta 1 day, 11:17:33
epoch [26/50] batch [920/2000] time 2.179 (2.580) data 0.000 (0.002) loss 0.7996 (1.2036) lr 1.3090e-03 eta 1 day, 11:10:11
epoch [26/50] batch [940/2000] time 2.799 (2.585) data 0.000 (0.002) loss 1.6531 (1.1983) lr 1.3090e-03 eta 1 day, 11:13:31
epoch [26/50] batch [960/2000] time 2.836 (2.590) data 0.000 (0.002) loss 0.2555 (1.1935) lr 1.3090e-03 eta 1 day, 11:16:38
epoch [26/50] batch [980/2000] time 2.783 (2.594) data 0.018 (0.002) loss 1.0969 (1.1954) lr 1.3090e-03 eta 1 day, 11:19:05
epoch [26/50] batch [1000/2000] time 2.780 (2.598) data 0.000 (0.002) loss 0.4512 (1.1924) lr 1.3090e-03 eta 1 day, 11:21:38
epoch [26/50] batch [1020/2000] time 2.220 (2.591) data 0.000 (0.002) loss 0.5122 (1.1928) lr 1.3090e-03 eta 1 day, 11:15:02
epoch [26/50] batch [1040/2000] time 2.839 (2.595) data 0.000 (0.002) loss 1.8744 (1.1952) lr 1.3090e-03 eta 1 day, 11:17:18
epoch [26/50] batch [1060/2000] time 3.094 (2.600) data 0.015 (0.002) loss 0.5837 (1.1928) lr 1.3090e-03 eta 1 day, 11:20:55
epoch [26/50] batch [1080/2000] time 2.745 (2.606) data 0.000 (0.002) loss 0.6054 (1.1951) lr 1.3090e-03 eta 1 day, 11:24:56
epoch [26/50] batch [1100/2000] time 3.189 (2.611) data 0.000 (0.002) loss 2.0913 (1.1928) lr 1.3090e-03 eta 1 day, 11:27:40
epoch [26/50] batch [1120/2000] time 2.273 (2.610) data 0.000 (0.002) loss 1.8677 (1.1906) lr 1.3090e-03 eta 1 day, 11:26:39
epoch [26/50] batch [1140/2000] time 3.002 (2.612) data 0.001 (0.002) loss 1.4935 (1.1889) lr 1.3090e-03 eta 1 day, 11:26:58
epoch [26/50] batch [1160/2000] time 3.184 (2.621) data 0.000 (0.002) loss 3.0765 (1.1918) lr 1.3090e-03 eta 1 day, 11:33:34
epoch [26/50] batch [1180/2000] time 3.081 (2.627) data 0.000 (0.002) loss 0.9222 (1.1921) lr 1.3090e-03 eta 1 day, 11:37:31
epoch [26/50] batch [1200/2000] time 2.933 (2.633) data 0.000 (0.002) loss 2.1149 (1.1898) lr 1.3090e-03 eta 1 day, 11:41:16
epoch [26/50] batch [1220/2000] time 2.159 (2.630) data 0.000 (0.002) loss 0.1852 (1.1840) lr 1.3090e-03 eta 1 day, 11:37:58
epoch [26/50] batch [1240/2000] time 2.877 (2.632) data 0.000 (0.002) loss 2.1644 (1.1829) lr 1.3090e-03 eta 1 day, 11:39:10
epoch [26/50] batch [1260/2000] time 2.950 (2.637) data 0.000 (0.002) loss 2.0003 (1.1848) lr 1.3090e-03 eta 1 day, 11:42:30
epoch [26/50] batch [1280/2000] time 2.945 (2.643) data 0.000 (0.002) loss 2.7316 (1.1804) lr 1.3090e-03 eta 1 day, 11:45:46
epoch [26/50] batch [1300/2000] time 2.971 (2.647) data 0.000 (0.002) loss 3.5345 (1.1769) lr 1.3090e-03 eta 1 day, 11:48:48
epoch [26/50] batch [1320/2000] time 2.094 (2.646) data 0.003 (0.002) loss 0.3302 (1.1747) lr 1.3090e-03 eta 1 day, 11:46:58
epoch [26/50] batch [1340/2000] time 3.119 (2.648) data 0.000 (0.002) loss 1.0590 (1.1792) lr 1.3090e-03 eta 1 day, 11:47:40
epoch [26/50] batch [1360/2000] time 3.155 (2.654) data 0.000 (0.002) loss 3.4204 (1.1821) lr 1.3090e-03 eta 1 day, 11:51:24
epoch [26/50] batch [1380/2000] time 2.857 (2.659) data 0.000 (0.001) loss 0.1271 (1.1832) lr 1.3090e-03 eta 1 day, 11:54:46
epoch [26/50] batch [1400/2000] time 2.807 (2.662) data 0.000 (0.001) loss 3.6091 (1.1846) lr 1.3090e-03 eta 1 day, 11:56:09
epoch [26/50] batch [1420/2000] time 2.880 (2.665) data 0.000 (0.001) loss 1.5216 (1.1874) lr 1.3090e-03 eta 1 day, 11:57:34
epoch [26/50] batch [1440/2000] time 2.255 (2.659) data 0.000 (0.001) loss 1.7498 (1.1871) lr 1.3090e-03 eta 1 day, 11:52:16
epoch [26/50] batch [1460/2000] time 3.203 (2.663) data 0.000 (0.001) loss 3.0846 (1.1885) lr 1.3090e-03 eta 1 day, 11:54:17
epoch [26/50] batch [1480/2000] time 3.076 (2.667) data 0.000 (0.001) loss 0.9501 (1.1893) lr 1.3090e-03 eta 1 day, 11:57:02
epoch [26/50] batch [1500/2000] time 2.749 (2.670) data 0.000 (0.001) loss 1.0533 (1.1888) lr 1.3090e-03 eta 1 day, 11:58:24
epoch [26/50] batch [1520/2000] time 2.955 (2.673) data 0.000 (0.001) loss 1.3887 (1.1885) lr 1.3090e-03 eta 1 day, 11:59:42
epoch [26/50] batch [1540/2000] time 2.814 (2.676) data 0.000 (0.001) loss 0.0852 (1.1855) lr 1.3090e-03 eta 1 day, 12:01:03
epoch [26/50] batch [1560/2000] time 2.261 (2.671) data 0.000 (0.001) loss 2.1654 (1.1853) lr 1.3090e-03 eta 1 day, 11:56:27
epoch [26/50] batch [1580/2000] time 2.794 (2.673) data 0.000 (0.001) loss 1.4013 (1.1869) lr 1.3090e-03 eta 1 day, 11:57:08
epoch [26/50] batch [1600/2000] time 3.148 (2.677) data 0.000 (0.001) loss 0.1890 (1.1865) lr 1.3090e-03 eta 1 day, 11:59:02
epoch [26/50] batch [1620/2000] time 3.001 (2.681) data 0.000 (0.001) loss 1.2572 (1.1842) lr 1.3090e-03 eta 1 day, 12:01:51
epoch [26/50] batch [1640/2000] time 2.896 (2.684) data 0.000 (0.001) loss 1.5482 (1.1838) lr 1.3090e-03 eta 1 day, 12:03:03
epoch [26/50] batch [1660/2000] time 2.944 (2.686) data 0.000 (0.001) loss 0.7944 (1.1826) lr 1.3090e-03 eta 1 day, 12:04:19
epoch [26/50] batch [1680/2000] time 2.045 (2.683) data 0.001 (0.001) loss 0.1356 (1.1821) lr 1.3090e-03 eta 1 day, 12:01:00
epoch [26/50] batch [1700/2000] time 2.940 (2.684) data 0.000 (0.001) loss 0.3034 (1.1857) lr 1.3090e-03 eta 1 day, 12:00:42
epoch [26/50] batch [1720/2000] time 2.843 (2.687) data 0.000 (0.001) loss 1.0514 (1.1867) lr 1.3090e-03 eta 1 day, 12:01:47
epoch [26/50] batch [1740/2000] time 2.823 (2.689) data 0.000 (0.001) loss 1.2053 (1.1924) lr 1.3090e-03 eta 1 day, 12:02:45
epoch [26/50] batch [1760/2000] time 3.014 (2.691) data 0.000 (0.001) loss 1.1941 (1.1945) lr 1.3090e-03 eta 1 day, 12:03:45
epoch [26/50] batch [1780/2000] time 2.837 (2.694) data 0.000 (0.001) loss 2.0010 (1.1917) lr 1.3090e-03 eta 1 day, 12:04:48
epoch [26/50] batch [1800/2000] time 2.932 (2.696) data 0.014 (0.001) loss 1.0548 (1.1948) lr 1.3090e-03 eta 1 day, 12:05:46
epoch [26/50] batch [1820/2000] time 2.046 (2.697) data 0.000 (0.001) loss 1.1307 (1.1951) lr 1.3090e-03 eta 1 day, 12:05:40
epoch [26/50] batch [1840/2000] time 3.053 (2.693) data 0.000 (0.001) loss 1.3909 (1.1948) lr 1.3090e-03 eta 1 day, 12:01:52
epoch [26/50] batch [1860/2000] time 2.781 (2.695) data 0.005 (0.001) loss 0.3238 (1.1941) lr 1.3090e-03 eta 1 day, 12:02:34
epoch [26/50] batch [1880/2000] time 3.013 (2.697) data 0.014 (0.001) loss 1.9196 (1.1935) lr 1.3090e-03 eta 1 day, 12:03:17
epoch [26/50] batch [1900/2000] time 2.919 (2.699) data 0.000 (0.001) loss 0.9300 (1.1940) lr 1.3090e-03 eta 1 day, 12:04:03
epoch [26/50] batch [1920/2000] time 2.880 (2.702) data 0.000 (0.001) loss 0.0544 (1.1942) lr 1.3090e-03 eta 1 day, 12:04:57
epoch [26/50] batch [1940/2000] time 2.762 (2.703) data 0.000 (0.001) loss 2.3884 (1.1920) lr 1.3090e-03 eta 1 day, 12:05:25
epoch [26/50] batch [1960/2000] time 2.822 (2.705) data 0.014 (0.001) loss 1.0002 (1.1917) lr 1.3090e-03 eta 1 day, 12:06:07
epoch [26/50] batch [1980/2000] time 2.173 (2.702) data 0.000 (0.001) loss 2.3371 (1.1905) lr 1.3090e-03 eta 1 day, 12:02:17
epoch [26/50] batch [2000/2000] time 2.877 (2.703) data 0.000 (0.001) loss 1.3076 (1.1884) lr 1.2487e-03 eta 1 day, 12:02:06
epoch [27/50] batch [20/2000] time 2.842 (2.947) data 0.000 (0.036) loss 1.3886 (0.9484) lr 1.2487e-03 eta 1 day, 15:16:46
epoch [27/50] batch [40/2000] time 2.947 (2.924) data 0.000 (0.018) loss 0.9618 (1.0509) lr 1.2487e-03 eta 1 day, 14:56:59
epoch [27/50] batch [60/2000] time 2.970 (2.928) data 0.001 (0.012) loss 1.7716 (1.1031) lr 1.2487e-03 eta 1 day, 14:59:11
epoch [27/50] batch [80/2000] time 3.000 (2.924) data 0.000 (0.009) loss 0.4415 (1.0751) lr 1.2487e-03 eta 1 day, 14:55:21
epoch [27/50] batch [100/2000] time 2.842 (2.919) data 0.000 (0.008) loss 1.1308 (1.0323) lr 1.2487e-03 eta 1 day, 14:50:03
epoch [27/50] batch [120/2000] time 2.077 (2.868) data 0.000 (0.006) loss 1.6624 (1.0378) lr 1.2487e-03 eta 1 day, 14:08:37
epoch [27/50] batch [140/2000] time 2.808 (2.823) data 0.000 (0.006) loss 2.0226 (1.0848) lr 1.2487e-03 eta 1 day, 13:31:40
epoch [27/50] batch [160/2000] time 2.849 (2.825) data 0.000 (0.005) loss 0.2982 (1.0910) lr 1.2487e-03 eta 1 day, 13:32:30
epoch [27/50] batch [180/2000] time 2.116 (2.823) data 0.000 (0.005) loss 1.0749 (1.0891) lr 1.2487e-03 eta 1 day, 13:30:04
epoch [27/50] batch [200/2000] time 2.909 (2.772) data 0.000 (0.004) loss 0.4503 (1.1199) lr 1.2487e-03 eta 1 day, 12:48:33
epoch [27/50] batch [220/2000] time 2.782 (2.781) data 0.000 (0.004) loss 0.5740 (1.1441) lr 1.2487e-03 eta 1 day, 12:54:48
epoch [27/50] batch [240/2000] time 2.858 (2.787) data 0.013 (0.004) loss 0.4045 (1.1370) lr 1.2487e-03 eta 1 day, 12:58:05
epoch [27/50] batch [260/2000] time 2.147 (2.746) data 0.000 (0.003) loss 1.8060 (1.1328) lr 1.2487e-03 eta 1 day, 12:24:58
epoch [27/50] batch [280/2000] time 2.781 (2.749) data 0.000 (0.003) loss 0.7514 (1.1746) lr 1.2487e-03 eta 1 day, 12:26:23
epoch [27/50] batch [300/2000] time 2.780 (2.756) data 0.000 (0.003) loss 0.8499 (1.1841) lr 1.2487e-03 eta 1 day, 12:30:42
epoch [27/50] batch [320/2000] time 2.102 (2.739) data 0.000 (0.003) loss 0.6657 (1.1840) lr 1.2487e-03 eta 1 day, 12:16:18
epoch [27/50] batch [340/2000] time 2.911 (2.733) data 0.000 (0.003) loss 1.2201 (1.1945) lr 1.2487e-03 eta 1 day, 12:11:17
epoch [27/50] batch [360/2000] time 2.796 (2.738) data 0.000 (0.003) loss 2.1787 (1.1846) lr 1.2487e-03 eta 1 day, 12:14:12
epoch [27/50] batch [380/2000] time 2.086 (2.735) data 0.000 (0.003) loss 1.1822 (1.1992) lr 1.2487e-03 eta 1 day, 12:10:37
epoch [27/50] batch [400/2000] time 2.796 (2.717) data 0.005 (0.002) loss 3.4056 (1.1981) lr 1.2487e-03 eta 1 day, 11:55:50
epoch [27/50] batch [420/2000] time 2.813 (2.722) data 0.002 (0.002) loss 2.3155 (1.1912) lr 1.2487e-03 eta 1 day, 11:58:22
epoch [27/50] batch [440/2000] time 3.034 (2.729) data 0.001 (0.002) loss 0.8182 (1.2081) lr 1.2487e-03 eta 1 day, 12:03:04
epoch [27/50] batch [460/2000] time 2.958 (2.706) data 0.000 (0.002) loss 0.3315 (1.2124) lr 1.2487e-03 eta 1 day, 11:44:00
epoch [27/50] batch [480/2000] time 2.964 (2.720) data 0.000 (0.002) loss 0.1795 (1.2089) lr 1.2487e-03 eta 1 day, 11:53:58
epoch [27/50] batch [500/2000] time 2.021 (2.728) data 0.000 (0.002) loss 0.2552 (1.2059) lr 1.2487e-03 eta 1 day, 11:59:52
epoch [27/50] batch [520/2000] time 2.833 (2.712) data 0.000 (0.002) loss 0.5204 (1.2041) lr 1.2487e-03 eta 1 day, 11:45:52
epoch [27/50] batch [540/2000] time 2.907 (2.719) data 0.000 (0.002) loss 2.4018 (1.2038) lr 1.2487e-03 eta 1 day, 11:50:24
epoch [27/50] batch [560/2000] time 2.830 (2.725) data 0.000 (0.002) loss 0.6688 (1.2012) lr 1.2487e-03 eta 1 day, 11:54:19
epoch [27/50] batch [580/2000] time 2.155 (2.707) data 0.000 (0.002) loss 2.0022 (1.2059) lr 1.2487e-03 eta 1 day, 11:39:23
epoch [27/50] batch [600/2000] time 2.900 (2.713) data 0.013 (0.002) loss 0.3488 (1.2006) lr 1.2487e-03 eta 1 day, 11:43:22
epoch [27/50] batch [620/2000] time 2.943 (2.719) data 0.000 (0.002) loss 0.2469 (1.2060) lr 1.2487e-03 eta 1 day, 11:47:11
epoch [27/50] batch [640/2000] time 2.149 (2.709) data 0.000 (0.002) loss 0.3590 (1.1937) lr 1.2487e-03 eta 1 day, 11:38:04
epoch [27/50] batch [660/2000] time 2.923 (2.710) data 0.000 (0.002) loss 2.4450 (1.1787) lr 1.2487e-03 eta 1 day, 11:38:28
epoch [27/50] batch [680/2000] time 2.864 (2.716) data 0.010 (0.002) loss 2.8121 (1.1769) lr 1.2487e-03 eta 1 day, 11:42:11
epoch [27/50] batch [700/2000] time 2.273 (2.711) data 0.000 (0.002) loss 0.9602 (1.1797) lr 1.2487e-03 eta 1 day, 11:37:02
epoch [27/50] batch [720/2000] time 2.862 (2.708) data 0.000 (0.002) loss 0.4355 (1.1796) lr 1.2487e-03 eta 1 day, 11:33:51
epoch [27/50] batch [740/2000] time 2.904 (2.713) data 0.000 (0.002) loss 2.3553 (1.1802) lr 1.2487e-03 eta 1 day, 11:36:33
epoch [27/50] batch [760/2000] time 2.071 (2.711) data 0.000 (0.002) loss 1.6073 (1.1768) lr 1.2487e-03 eta 1 day, 11:34:29
epoch [27/50] batch [780/2000] time 2.875 (2.705) data 0.000 (0.002) loss 0.8781 (1.1723) lr 1.2487e-03 eta 1 day, 11:28:45
epoch [27/50] batch [800/2000] time 2.933 (2.709) data 0.000 (0.002) loss 1.4485 (1.1840) lr 1.2487e-03 eta 1 day, 11:31:12
epoch [27/50] batch [820/2000] time 2.019 (2.711) data 0.002 (0.002) loss 1.3298 (1.1874) lr 1.2487e-03 eta 1 day, 11:32:07
epoch [27/50] batch [840/2000] time 2.920 (2.703) data 0.000 (0.002) loss 0.7577 (1.1858) lr 1.2487e-03 eta 1 day, 11:24:25
epoch [27/50] batch [860/2000] time 2.891 (2.707) data 0.000 (0.002) loss 0.0783 (1.1750) lr 1.2487e-03 eta 1 day, 11:26:27
epoch [27/50] batch [880/2000] time 2.873 (2.711) data 0.000 (0.001) loss 1.6827 (1.1744) lr 1.2487e-03 eta 1 day, 11:28:39
epoch [27/50] batch [900/2000] time 3.043 (2.701) data 0.001 (0.001) loss 1.8802 (1.1748) lr 1.2487e-03 eta 1 day, 11:20:02
epoch [27/50] batch [920/2000] time 2.924 (2.705) data 0.000 (0.001) loss 0.1787 (1.1672) lr 1.2487e-03 eta 1 day, 11:22:22
epoch [27/50] batch [940/2000] time 2.876 (2.709) data 0.000 (0.001) loss 1.3042 (1.1700) lr 1.2487e-03 eta 1 day, 11:24:39
epoch [27/50] batch [960/2000] time 2.200 (2.701) data 0.000 (0.001) loss 3.5169 (1.1706) lr 1.2487e-03 eta 1 day, 11:17:41
epoch [27/50] batch [980/2000] time 3.159 (2.705) data 0.000 (0.001) loss 0.4858 (1.1695) lr 1.2487e-03 eta 1 day, 11:19:42
epoch [27/50] batch [1000/2000] time 2.904 (2.711) data 0.000 (0.001) loss 1.9615 (1.1767) lr 1.2487e-03 eta 1 day, 11:23:51
epoch [27/50] batch [1020/2000] time 2.844 (2.703) data 0.000 (0.001) loss 1.7703 (1.1744) lr 1.2487e-03 eta 1 day, 11:16:04
epoch [27/50] batch [1040/2000] time 3.044 (2.707) data 0.000 (0.001) loss 1.8849 (1.1705) lr 1.2487e-03 eta 1 day, 11:18:35
epoch [27/50] batch [1060/2000] time 2.885 (2.711) data 0.000 (0.001) loss 1.7261 (1.1724) lr 1.2487e-03 eta 1 day, 11:20:52
epoch [27/50] batch [1080/2000] time 2.732 (2.704) data 0.004 (0.001) loss 0.2592 (1.1708) lr 1.2487e-03 eta 1 day, 11:14:19
epoch [27/50] batch [1100/2000] time 2.015 (2.695) data 0.000 (0.001) loss 0.2226 (1.1759) lr 1.2487e-03 eta 1 day, 11:06:33
epoch [27/50] batch [1120/2000] time 2.121 (2.686) data 0.004 (0.001) loss 0.8752 (1.1726) lr 1.2487e-03 eta 1 day, 10:58:29
epoch [27/50] batch [1140/2000] time 2.046 (2.677) data 0.001 (0.001) loss 1.4451 (1.1732) lr 1.2487e-03 eta 1 day, 10:51:05
epoch [27/50] batch [1160/2000] time 2.118 (2.669) data 0.000 (0.001) loss 1.3035 (1.1729) lr 1.2487e-03 eta 1 day, 10:43:54
epoch [27/50] batch [1180/2000] time 2.860 (2.663) data 0.000 (0.001) loss 2.1030 (1.1755) lr 1.2487e-03 eta 1 day, 10:38:00
epoch [27/50] batch [1200/2000] time 2.069 (2.656) data 0.000 (0.001) loss 0.3526 (1.1756) lr 1.2487e-03 eta 1 day, 10:31:28
epoch [27/50] batch [1220/2000] time 2.012 (2.648) data 0.000 (0.001) loss 1.2263 (1.1797) lr 1.2487e-03 eta 1 day, 10:24:49
epoch [27/50] batch [1240/2000] time 2.174 (2.642) data 0.000 (0.001) loss 0.2890 (1.1751) lr 1.2487e-03 eta 1 day, 10:18:51
epoch [27/50] batch [1260/2000] time 2.176 (2.635) data 0.000 (0.001) loss 0.7381 (1.1756) lr 1.2487e-03 eta 1 day, 10:13:00
epoch [27/50] batch [1280/2000] time 2.167 (2.629) data 0.000 (0.001) loss 0.3753 (1.1742) lr 1.2487e-03 eta 1 day, 10:07:24
epoch [27/50] batch [1300/2000] time 2.769 (2.624) data 0.000 (0.001) loss 1.0037 (1.1745) lr 1.2487e-03 eta 1 day, 10:02:21
epoch [27/50] batch [1320/2000] time 2.715 (2.619) data 0.000 (0.001) loss 0.9510 (1.1764) lr 1.2487e-03 eta 1 day, 9:57:53
epoch [27/50] batch [1340/2000] time 2.067 (2.613) data 0.001 (0.001) loss 0.1930 (1.1741) lr 1.2487e-03 eta 1 day, 9:51:47
epoch [27/50] batch [1360/2000] time 2.070 (2.606) data 0.000 (0.001) loss 0.8153 (1.1740) lr 1.2487e-03 eta 1 day, 9:45:54
epoch [27/50] batch [1380/2000] time 2.083 (2.600) data 0.000 (0.001) loss 1.0975 (1.1722) lr 1.2487e-03 eta 1 day, 9:40:25
epoch [27/50] batch [1400/2000] time 2.029 (2.594) data 0.000 (0.001) loss 0.0514 (1.1688) lr 1.2487e-03 eta 1 day, 9:34:49
epoch [27/50] batch [1420/2000] time 2.173 (2.588) data 0.003 (0.001) loss 0.4652 (1.1700) lr 1.2487e-03 eta 1 day, 9:29:26
epoch [27/50] batch [1440/2000] time 2.170 (2.583) data 0.000 (0.001) loss 1.0296 (1.1685) lr 1.2487e-03 eta 1 day, 9:24:10
epoch [27/50] batch [1460/2000] time 2.181 (2.578) data 0.000 (0.001) loss 2.3671 (1.1696) lr 1.2487e-03 eta 1 day, 9:19:38
epoch [27/50] batch [1480/2000] time 2.068 (2.573) data 0.000 (0.001) loss 0.1856 (1.1662) lr 1.2487e-03 eta 1 day, 9:14:36
epoch [27/50] batch [1500/2000] time 2.241 (2.567) data 0.000 (0.001) loss 0.2425 (1.1762) lr 1.2487e-03 eta 1 day, 9:09:41
epoch [27/50] batch [1520/2000] time 2.074 (2.562) data 0.000 (0.001) loss 2.0047 (1.1801) lr 1.2487e-03 eta 1 day, 9:05:00
epoch [27/50] batch [1540/2000] time 2.123 (2.558) data 0.000 (0.001) loss 0.4745 (1.1756) lr 1.2487e-03 eta 1 day, 9:00:22
epoch [27/50] batch [1560/2000] time 2.177 (2.553) data 0.000 (0.001) loss 0.6970 (1.1744) lr 1.2487e-03 eta 1 day, 8:55:46
epoch [27/50] batch [1580/2000] time 2.243 (2.549) data 0.000 (0.001) loss 0.9712 (1.1750) lr 1.2487e-03 eta 1 day, 8:51:54
epoch [27/50] batch [1600/2000] time 2.078 (2.545) data 0.000 (0.001) loss 0.3326 (1.1737) lr 1.2487e-03 eta 1 day, 8:47:56
epoch [27/50] batch [1620/2000] time 2.073 (2.541) data 0.000 (0.001) loss 0.7028 (1.1747) lr 1.2487e-03 eta 1 day, 8:44:10
epoch [27/50] batch [1640/2000] time 2.066 (2.537) data 0.000 (0.001) loss 0.5734 (1.1740) lr 1.2487e-03 eta 1 day, 8:40:22
epoch [27/50] batch [1660/2000] time 2.046 (2.534) data 0.000 (0.001) loss 0.3180 (1.1734) lr 1.2487e-03 eta 1 day, 8:37:03
epoch [27/50] batch [1680/2000] time 2.015 (2.530) data 0.005 (0.001) loss 2.8371 (1.1753) lr 1.2487e-03 eta 1 day, 8:33:31
epoch [27/50] batch [1700/2000] time 2.043 (2.527) data 0.000 (0.001) loss 0.1614 (1.1713) lr 1.2487e-03 eta 1 day, 8:30:18
epoch [27/50] batch [1720/2000] time 2.077 (2.525) data 0.000 (0.001) loss 0.9541 (1.1681) lr 1.2487e-03 eta 1 day, 8:27:17
epoch [27/50] batch [1740/2000] time 2.078 (2.522) data 0.000 (0.001) loss 0.2955 (1.1692) lr 1.2487e-03 eta 1 day, 8:24:09
epoch [27/50] batch [1760/2000] time 2.067 (2.519) data 0.000 (0.001) loss 0.0674 (1.1644) lr 1.2487e-03 eta 1 day, 8:21:09
epoch [27/50] batch [1780/2000] time 2.073 (2.516) data 0.000 (0.001) loss 1.6277 (1.1652) lr 1.2487e-03 eta 1 day, 8:18:17
epoch [27/50] batch [1800/2000] time 2.069 (2.514) data 0.001 (0.001) loss 0.5939 (1.1659) lr 1.2487e-03 eta 1 day, 8:15:29
epoch [27/50] batch [1820/2000] time 2.086 (2.511) data 0.003 (0.001) loss 0.4745 (1.1665) lr 1.2487e-03 eta 1 day, 8:12:51
epoch [27/50] batch [1840/2000] time 2.071 (2.509) data 0.000 (0.001) loss 0.7975 (1.1649) lr 1.2487e-03 eta 1 day, 8:10:25
epoch [27/50] batch [1860/2000] time 2.763 (2.507) data 0.000 (0.001) loss 1.4005 (1.1684) lr 1.2487e-03 eta 1 day, 8:07:42
epoch [27/50] batch [1880/2000] time 2.751 (2.504) data 0.001 (0.001) loss 0.0727 (1.1744) lr 1.2487e-03 eta 1 day, 8:04:51
epoch [27/50] batch [1900/2000] time 2.762 (2.501) data 0.000 (0.001) loss 1.6321 (1.1745) lr 1.2487e-03 eta 1 day, 8:01:57
epoch [27/50] batch [1920/2000] time 2.072 (2.499) data 0.000 (0.001) loss 1.8781 (1.1739) lr 1.2487e-03 eta 1 day, 7:58:56
epoch [27/50] batch [1940/2000] time 2.046 (2.496) data 0.000 (0.001) loss 2.6074 (1.1759) lr 1.2487e-03 eta 1 day, 7:55:51
epoch [27/50] batch [1960/2000] time 2.088 (2.493) data 0.000 (0.001) loss 1.4369 (1.1727) lr 1.2487e-03 eta 1 day, 7:52:36
epoch [27/50] batch [1980/2000] time 2.332 (2.490) data 0.000 (0.001) loss 0.0528 (1.1755) lr 1.2487e-03 eta 1 day, 7:49:35
epoch [27/50] batch [2000/2000] time 2.067 (2.487) data 0.000 (0.001) loss 2.3395 (1.1755) lr 1.1874e-03 eta 1 day, 7:46:38
epoch [28/50] batch [20/2000] time 2.167 (2.247) data 0.000 (0.035) loss 1.0836 (1.3286) lr 1.1874e-03 eta 1 day, 4:41:43
epoch [28/50] batch [40/2000] time 2.117 (2.230) data 0.000 (0.018) loss 1.2894 (1.2556) lr 1.1874e-03 eta 1 day, 4:28:04
epoch [28/50] batch [60/2000] time 2.687 (2.235) data 0.003 (0.012) loss 2.4733 (1.2404) lr 1.1874e-03 eta 1 day, 4:31:02
epoch [28/50] batch [80/2000] time 2.752 (2.237) data 0.000 (0.009) loss 0.5295 (1.2359) lr 1.1874e-03 eta 1 day, 4:31:40
epoch [28/50] batch [100/2000] time 2.065 (2.235) data 0.000 (0.007) loss 0.5925 (1.1915) lr 1.1874e-03 eta 1 day, 4:30:03
epoch [28/50] batch [120/2000] time 2.070 (2.228) data 0.000 (0.006) loss 0.2091 (1.2091) lr 1.1874e-03 eta 1 day, 4:23:27
epoch [28/50] batch [140/2000] time 2.020 (2.223) data 0.000 (0.005) loss 0.6586 (1.2350) lr 1.1874e-03 eta 1 day, 4:19:21
epoch [28/50] batch [160/2000] time 2.346 (2.223) data 0.000 (0.005) loss 0.1646 (1.2233) lr 1.1874e-03 eta 1 day, 4:18:28
epoch [28/50] batch [180/2000] time 2.240 (2.239) data 0.001 (0.004) loss 0.3608 (1.1790) lr 1.1874e-03 eta 1 day, 4:29:55
epoch [28/50] batch [200/2000] time 2.765 (2.253) data 0.000 (0.004) loss 0.9366 (1.1979) lr 1.1874e-03 eta 1 day, 4:39:37
epoch [28/50] batch [220/2000] time 2.895 (2.253) data 0.000 (0.004) loss 0.8884 (1.2525) lr 1.1874e-03 eta 1 day, 4:38:52
epoch [28/50] batch [240/2000] time 2.585 (2.254) data 0.000 (0.003) loss 1.9054 (1.2491) lr 1.1874e-03 eta 1 day, 4:39:15
epoch [28/50] batch [260/2000] time 2.174 (2.266) data 0.000 (0.003) loss 1.0328 (1.2489) lr 1.1874e-03 eta 1 day, 4:47:23
epoch [28/50] batch [280/2000] time 2.292 (2.278) data 0.000 (0.003) loss 2.9161 (1.2270) lr 1.1874e-03 eta 1 day, 4:56:08
epoch [28/50] batch [300/2000] time 2.072 (2.290) data 0.000 (0.003) loss 0.6288 (1.2148) lr 1.1874e-03 eta 1 day, 5:03:56
epoch [28/50] batch [320/2000] time 2.716 (2.293) data 0.000 (0.003) loss 0.7187 (1.2026) lr 1.1874e-03 eta 1 day, 5:05:36
epoch [28/50] batch [340/2000] time 2.523 (2.291) data 0.001 (0.003) loss 0.5669 (1.2219) lr 1.1874e-03 eta 1 day, 5:03:43
epoch [28/50] batch [360/2000] time 2.064 (2.301) data 0.000 (0.002) loss 1.1521 (1.2187) lr 1.1874e-03 eta 1 day, 5:10:17
epoch [28/50] batch [380/2000] time 2.062 (2.310) data 0.000 (0.002) loss 0.1533 (1.2036) lr 1.1874e-03 eta 1 day, 5:16:07
epoch [28/50] batch [400/2000] time 2.711 (2.317) data 0.000 (0.002) loss 0.1016 (1.1893) lr 1.1874e-03 eta 1 day, 5:20:45
epoch [28/50] batch [420/2000] time 2.731 (2.316) data 0.000 (0.002) loss 1.2036 (1.1889) lr 1.1874e-03 eta 1 day, 5:19:43
epoch [28/50] batch [440/2000] time 2.075 (2.323) data 0.000 (0.002) loss 0.4970 (1.1933) lr 1.1874e-03 eta 1 day, 5:24:01
epoch [28/50] batch [460/2000] time 2.082 (2.332) data 0.000 (0.002) loss 1.9725 (1.2154) lr 1.1874e-03 eta 1 day, 5:29:43
epoch [28/50] batch [480/2000] time 2.833 (2.334) data 0.000 (0.002) loss 1.1953 (1.2086) lr 1.1874e-03 eta 1 day, 5:30:48
epoch [28/50] batch [500/2000] time 2.141 (2.333) data 0.000 (0.002) loss 1.8249 (1.2109) lr 1.1874e-03 eta 1 day, 5:29:31
epoch [28/50] batch [520/2000] time 2.010 (2.342) data 0.000 (0.002) loss 0.4387 (1.2127) lr 1.1874e-03 eta 1 day, 5:35:18
epoch [28/50] batch [540/2000] time 2.836 (2.347) data 0.000 (0.002) loss 1.4011 (1.2123) lr 1.1874e-03 eta 1 day, 5:38:08
epoch [28/50] batch [560/2000] time 2.750 (2.343) data 0.000 (0.002) loss 2.5265 (1.2183) lr 1.1874e-03 eta 1 day, 5:34:43
epoch [28/50] batch [580/2000] time 2.105 (2.342) data 0.000 (0.002) loss 0.4534 (1.2373) lr 1.1874e-03 eta 1 day, 5:32:38
epoch [28/50] batch [600/2000] time 2.135 (2.341) data 0.001 (0.002) loss 0.3555 (1.2325) lr 1.1874e-03 eta 1 day, 5:31:20
epoch [28/50] batch [620/2000] time 2.011 (2.340) data 0.000 (0.002) loss 0.2479 (1.2188) lr 1.1874e-03 eta 1 day, 5:29:42
epoch [28/50] batch [640/2000] time 2.072 (2.340) data 0.000 (0.002) loss 1.3435 (1.2170) lr 1.1874e-03 eta 1 day, 5:29:08
epoch [28/50] batch [660/2000] time 2.328 (2.339) data 0.000 (0.002) loss 2.6247 (1.2180) lr 1.1874e-03 eta 1 day, 5:27:47
epoch [28/50] batch [680/2000] time 2.016 (2.338) data 0.000 (0.002) loss 1.2447 (1.2115) lr 1.1874e-03 eta 1 day, 5:25:56
epoch [28/50] batch [700/2000] time 2.060 (2.338) data 0.000 (0.002) loss 0.1918 (1.2110) lr 1.1874e-03 eta 1 day, 5:25:33
epoch [28/50] batch [720/2000] time 2.662 (2.338) data 0.000 (0.002) loss 2.0804 (1.2153) lr 1.1874e-03 eta 1 day, 5:24:30
epoch [28/50] batch [740/2000] time 2.796 (2.336) data 0.000 (0.001) loss 1.1173 (1.2287) lr 1.1874e-03 eta 1 day, 5:22:15
epoch [28/50] batch [760/2000] time 2.784 (2.334) data 0.004 (0.001) loss 0.7382 (1.2273) lr 1.1874e-03 eta 1 day, 5:20:11
epoch [28/50] batch [780/2000] time 2.473 (2.333) data 0.000 (0.001) loss 0.0938 (1.2287) lr 1.1874e-03 eta 1 day, 5:18:02
epoch [28/50] batch [800/2000] time 2.101 (2.332) data 0.000 (0.001) loss 2.2978 (1.2267) lr 1.1874e-03 eta 1 day, 5:16:33
epoch [28/50] batch [820/2000] time 2.076 (2.332) data 0.000 (0.001) loss 0.5645 (1.2182) lr 1.1874e-03 eta 1 day, 5:15:38
epoch [28/50] batch [840/2000] time 2.010 (2.331) data 0.000 (0.001) loss 0.6071 (1.2086) lr 1.1874e-03 eta 1 day, 5:14:48
epoch [28/50] batch [860/2000] time 2.073 (2.331) data 0.000 (0.001) loss 1.4118 (1.2045) lr 1.1874e-03 eta 1 day, 5:13:46
epoch [28/50] batch [880/2000] time 2.101 (2.331) data 0.000 (0.001) loss 2.1050 (1.2014) lr 1.1874e-03 eta 1 day, 5:12:43
epoch [28/50] batch [900/2000] time 2.934 (2.334) data 0.000 (0.001) loss 1.1660 (1.1982) lr 1.1874e-03 eta 1 day, 5:14:21
epoch [28/50] batch [920/2000] time 2.088 (2.337) data 0.000 (0.001) loss 1.3996 (1.1944) lr 1.1874e-03 eta 1 day, 5:15:51
epoch [28/50] batch [940/2000] time 2.913 (2.344) data 0.000 (0.001) loss 0.9954 (1.1961) lr 1.1874e-03 eta 1 day, 5:19:59
epoch [28/50] batch [960/2000] time 2.133 (2.344) data 0.000 (0.001) loss 1.6954 (1.1967) lr 1.1874e-03 eta 1 day, 5:19:19
epoch [28/50] batch [980/2000] time 2.781 (2.353) data 0.000 (0.001) loss 2.3678 (1.1929) lr 1.1874e-03 eta 1 day, 5:25:10
epoch [28/50] batch [1000/2000] time 2.511 (2.351) data 0.000 (0.001) loss 0.9799 (1.1940) lr 1.1874e-03 eta 1 day, 5:23:00
epoch [28/50] batch [1020/2000] time 2.814 (2.361) data 0.001 (0.001) loss 2.7290 (1.1960) lr 1.1874e-03 eta 1 day, 5:30:04
epoch [28/50] batch [1040/2000] time 2.454 (2.359) data 0.000 (0.001) loss 0.5006 (1.1892) lr 1.1874e-03 eta 1 day, 5:27:53
epoch [28/50] batch [1060/2000] time 2.825 (2.369) data 0.000 (0.001) loss 0.8035 (1.1884) lr 1.1874e-03 eta 1 day, 5:34:19
epoch [28/50] batch [1080/2000] time 2.131 (2.367) data 0.000 (0.001) loss 1.2609 (1.1824) lr 1.1874e-03 eta 1 day, 5:31:58
epoch [28/50] batch [1100/2000] time 2.851 (2.376) data 0.000 (0.001) loss 2.6292 (1.1886) lr 1.1874e-03 eta 1 day, 5:37:54
epoch [28/50] batch [1120/2000] time 2.151 (2.374) data 0.000 (0.001) loss 4.9088 (1.1880) lr 1.1874e-03 eta 1 day, 5:35:58
epoch [28/50] batch [1140/2000] time 2.843 (2.381) data 0.001 (0.001) loss 0.8448 (1.1859) lr 1.1874e-03 eta 1 day, 5:40:24
epoch [28/50] batch [1160/2000] time 2.294 (2.384) data 0.000 (0.001) loss 0.5555 (1.1817) lr 1.1874e-03 eta 1 day, 5:41:49
epoch [28/50] batch [1180/2000] time 2.786 (2.386) data 0.000 (0.001) loss 1.9461 (1.1845) lr 1.1874e-03 eta 1 day, 5:42:17
epoch [28/50] batch [1200/2000] time 2.793 (2.393) data 0.000 (0.001) loss 0.1014 (1.1782) lr 1.1874e-03 eta 1 day, 5:46:46
epoch [28/50] batch [1220/2000] time 2.813 (2.390) data 0.000 (0.001) loss 0.9187 (1.1753) lr 1.1874e-03 eta 1 day, 5:43:56
epoch [28/50] batch [1240/2000] time 2.801 (2.397) data 0.000 (0.001) loss 0.5893 (1.1732) lr 1.1874e-03 eta 1 day, 5:48:22
epoch [28/50] batch [1260/2000] time 2.077 (2.398) data 0.000 (0.001) loss 1.0914 (1.1737) lr 1.1874e-03 eta 1 day, 5:47:56
epoch [28/50] batch [1280/2000] time 2.798 (2.401) data 0.000 (0.001) loss 0.7174 (1.1739) lr 1.1874e-03 eta 1 day, 5:49:44
epoch [28/50] batch [1300/2000] time 2.699 (2.407) data 0.000 (0.001) loss 0.3439 (1.1733) lr 1.1874e-03 eta 1 day, 5:53:34
epoch [28/50] batch [1320/2000] time 2.816 (2.405) data 0.000 (0.001) loss 1.0123 (1.1777) lr 1.1874e-03 eta 1 day, 5:50:36
epoch [28/50] batch [1340/2000] time 2.861 (2.411) data 0.001 (0.001) loss 1.6481 (1.1763) lr 1.1874e-03 eta 1 day, 5:54:15
epoch [28/50] batch [1360/2000] time 2.038 (2.414) data 0.000 (0.001) loss 1.3964 (1.1802) lr 1.1874e-03 eta 1 day, 5:55:42
epoch [28/50] batch [1380/2000] time 2.872 (2.414) data 0.000 (0.001) loss 0.5198 (1.1853) lr 1.1874e-03 eta 1 day, 5:55:25
epoch [28/50] batch [1400/2000] time 2.832 (2.420) data 0.001 (0.001) loss 2.7620 (1.1883) lr 1.1874e-03 eta 1 day, 5:59:04
epoch [28/50] batch [1420/2000] time 2.174 (2.420) data 0.000 (0.001) loss 0.9517 (1.1878) lr 1.1874e-03 eta 1 day, 5:57:43
epoch [28/50] batch [1440/2000] time 2.758 (2.423) data 0.000 (0.001) loss 0.6271 (1.1831) lr 1.1874e-03 eta 1 day, 5:59:49
epoch [28/50] batch [1460/2000] time 2.950 (2.429) data 0.000 (0.001) loss 0.9885 (1.1817) lr 1.1874e-03 eta 1 day, 6:03:01
epoch [28/50] batch [1480/2000] time 2.466 (2.426) data 0.000 (0.001) loss 2.1363 (1.1867) lr 1.1874e-03 eta 1 day, 6:00:26
epoch [28/50] batch [1500/2000] time 2.812 (2.432) data 0.010 (0.001) loss 0.1586 (1.1818) lr 1.1874e-03 eta 1 day, 6:03:46
epoch [28/50] batch [1520/2000] time 2.492 (2.437) data 0.000 (0.001) loss 0.5988 (1.1808) lr 1.1874e-03 eta 1 day, 6:06:56
epoch [28/50] batch [1540/2000] time 2.872 (2.435) data 0.000 (0.001) loss 0.9578 (1.1776) lr 1.1874e-03 eta 1 day, 6:04:32
epoch [28/50] batch [1560/2000] time 2.835 (2.440) data 0.001 (0.001) loss 0.4391 (1.1742) lr 1.1874e-03 eta 1 day, 6:07:20
epoch [28/50] batch [1580/2000] time 2.066 (2.443) data 0.000 (0.001) loss 2.0737 (1.1717) lr 1.1874e-03 eta 1 day, 6:08:37
epoch [28/50] batch [1600/2000] time 2.874 (2.443) data 0.000 (0.001) loss 0.5899 (1.1697) lr 1.1874e-03 eta 1 day, 6:07:49
epoch [28/50] batch [1620/2000] time 2.228 (2.442) data 0.000 (0.001) loss 1.4320 (1.1647) lr 1.1874e-03 eta 1 day, 6:06:36
epoch [28/50] batch [1640/2000] time 2.683 (2.445) data 0.000 (0.001) loss 0.7872 (1.1611) lr 1.1874e-03 eta 1 day, 6:07:54
epoch [28/50] batch [1660/2000] time 2.956 (2.443) data 0.002 (0.001) loss 1.0853 (1.1623) lr 1.1874e-03 eta 1 day, 6:05:25
epoch [28/50] batch [1680/2000] time 2.289 (2.445) data 0.001 (0.001) loss 0.0932 (1.1607) lr 1.1874e-03 eta 1 day, 6:05:52
epoch [28/50] batch [1700/2000] time 2.841 (2.445) data 0.000 (0.001) loss 2.3348 (1.1573) lr 1.1874e-03 eta 1 day, 6:05:23
epoch [28/50] batch [1720/2000] time 2.134 (2.444) data 0.000 (0.001) loss 0.1891 (1.1582) lr 1.1874e-03 eta 1 day, 6:03:26
epoch [28/50] batch [1740/2000] time 2.065 (2.447) data 0.002 (0.001) loss 2.8742 (1.1597) lr 1.1874e-03 eta 1 day, 6:04:47
epoch [28/50] batch [1760/2000] time 2.949 (2.445) data 0.000 (0.001) loss 2.0521 (1.1576) lr 1.1874e-03 eta 1 day, 6:03:01
epoch [28/50] batch [1780/2000] time 2.033 (2.446) data 0.000 (0.001) loss 2.7600 (1.1599) lr 1.1874e-03 eta 1 day, 6:02:54
epoch [28/50] batch [1800/2000] time 2.854 (2.447) data 0.000 (0.001) loss 1.6773 (1.1600) lr 1.1874e-03 eta 1 day, 6:02:58
epoch [28/50] batch [1820/2000] time 2.114 (2.446) data 0.000 (0.001) loss 0.0766 (1.1543) lr 1.1874e-03 eta 1 day, 6:00:54
epoch [28/50] batch [1840/2000] time 2.037 (2.449) data 0.000 (0.001) loss 1.4199 (1.1553) lr 1.1874e-03 eta 1 day, 6:02:05
epoch [28/50] batch [1860/2000] time 2.768 (2.447) data 0.000 (0.001) loss 2.4157 (1.1522) lr 1.1874e-03 eta 1 day, 6:00:19
epoch [28/50] batch [1880/2000] time 2.077 (2.448) data 0.000 (0.001) loss 0.4708 (1.1544) lr 1.1874e-03 eta 1 day, 5:59:48
epoch [28/50] batch [1900/2000] time 2.879 (2.449) data 0.000 (0.001) loss 1.6204 (1.1566) lr 1.1874e-03 eta 1 day, 5:59:54
epoch [28/50] batch [1920/2000] time 2.178 (2.447) data 0.000 (0.001) loss 1.2276 (1.1584) lr 1.1874e-03 eta 1 day, 5:57:40
epoch [28/50] batch [1940/2000] time 2.053 (2.450) data 0.000 (0.001) loss 1.3375 (1.1586) lr 1.1874e-03 eta 1 day, 5:59:02
epoch [28/50] batch [1960/2000] time 2.926 (2.449) data 0.001 (0.001) loss 1.8204 (1.1592) lr 1.1874e-03 eta 1 day, 5:57:52
epoch [28/50] batch [1980/2000] time 2.151 (2.450) data 0.013 (0.001) loss 0.4660 (1.1621) lr 1.1874e-03 eta 1 day, 5:57:11
epoch [28/50] batch [2000/2000] time 2.131 (2.453) data 0.000 (0.001) loss 0.9710 (1.1613) lr 1.1253e-03 eta 1 day, 5:58:36
epoch [29/50] batch [20/2000] time 2.836 (2.593) data 0.000 (0.062) loss 1.7159 (1.0341) lr 1.1253e-03 eta 1 day, 7:40:18
epoch [29/50] batch [40/2000] time 2.138 (2.454) data 0.000 (0.032) loss 1.4163 (1.2303) lr 1.1253e-03 eta 1 day, 5:57:46
epoch [29/50] batch [60/2000] time 2.205 (2.532) data 0.001 (0.021) loss 0.4728 (1.3461) lr 1.1253e-03 eta 1 day, 6:54:14
epoch [29/50] batch [80/2000] time 2.081 (2.461) data 0.000 (0.016) loss 0.8411 (1.4014) lr 1.1253e-03 eta 1 day, 6:01:45
epoch [29/50] batch [100/2000] time 2.180 (2.416) data 0.001 (0.013) loss 0.7942 (1.3163) lr 1.1253e-03 eta 1 day, 5:27:36
epoch [29/50] batch [120/2000] time 2.165 (2.387) data 0.000 (0.011) loss 0.9007 (1.2662) lr 1.1253e-03 eta 1 day, 5:05:32
epoch [29/50] batch [140/2000] time 2.543 (2.369) data 0.000 (0.010) loss 2.4566 (1.2816) lr 1.1253e-03 eta 1 day, 4:52:01
epoch [29/50] batch [160/2000] time 2.815 (2.363) data 0.000 (0.008) loss 0.1884 (1.2234) lr 1.1253e-03 eta 1 day, 4:46:42
epoch [29/50] batch [180/2000] time 2.846 (2.355) data 0.000 (0.008) loss 0.6004 (1.1893) lr 1.1253e-03 eta 1 day, 4:40:14
epoch [29/50] batch [200/2000] time 2.719 (2.349) data 0.000 (0.007) loss 1.2033 (1.1992) lr 1.1253e-03 eta 1 day, 4:35:07
epoch [29/50] batch [220/2000] time 2.550 (2.343) data 0.000 (0.006) loss 1.9820 (1.1901) lr 1.1253e-03 eta 1 day, 4:29:45
epoch [29/50] batch [240/2000] time 2.382 (2.341) data 0.000 (0.006) loss 3.1187 (1.1952) lr 1.1253e-03 eta 1 day, 4:27:13
epoch [29/50] batch [260/2000] time 2.462 (2.337) data 0.000 (0.005) loss 0.3648 (1.1761) lr 1.1253e-03 eta 1 day, 4:23:58
epoch [29/50] batch [280/2000] time 2.074 (2.333) data 0.000 (0.005) loss 3.1025 (1.1644) lr 1.1253e-03 eta 1 day, 4:20:11
epoch [29/50] batch [300/2000] time 2.068 (2.331) data 0.000 (0.005) loss 1.8221 (1.1863) lr 1.1253e-03 eta 1 day, 4:18:02
epoch [29/50] batch [320/2000] time 2.079 (2.330) data 0.000 (0.005) loss 2.9954 (1.1774) lr 1.1253e-03 eta 1 day, 4:15:52
epoch [29/50] batch [340/2000] time 2.092 (2.328) data 0.000 (0.004) loss 0.4638 (1.1703) lr 1.1253e-03 eta 1 day, 4:14:15
epoch [29/50] batch [360/2000] time 2.197 (2.322) data 0.000 (0.004) loss 1.3807 (1.1777) lr 1.1253e-03 eta 1 day, 4:09:10
epoch [29/50] batch [380/2000] time 2.123 (2.317) data 0.000 (0.004) loss 0.8716 (1.1957) lr 1.1253e-03 eta 1 day, 4:04:10
epoch [29/50] batch [400/2000] time 2.173 (2.312) data 0.000 (0.004) loss 1.5264 (1.1939) lr 1.1253e-03 eta 1 day, 3:59:51
epoch [29/50] batch [420/2000] time 2.781 (2.308) data 0.001 (0.004) loss 1.8661 (1.1874) lr 1.1253e-03 eta 1 day, 3:56:38
epoch [29/50] batch [440/2000] time 2.170 (2.306) data 0.000 (0.003) loss 0.0757 (1.1838) lr 1.1253e-03 eta 1 day, 3:54:02
epoch [29/50] batch [460/2000] time 2.059 (2.301) data 0.000 (0.003) loss 0.4084 (1.1712) lr 1.1253e-03 eta 1 day, 3:49:36
epoch [29/50] batch [480/2000] time 2.014 (2.297) data 0.000 (0.003) loss 1.3503 (1.1780) lr 1.1253e-03 eta 1 day, 3:46:07
epoch [29/50] batch [500/2000] time 2.011 (2.293) data 0.000 (0.003) loss 0.1113 (1.1676) lr 1.1253e-03 eta 1 day, 3:42:34
epoch [29/50] batch [520/2000] time 2.116 (2.291) data 0.000 (0.003) loss 0.8999 (1.1709) lr 1.1253e-03 eta 1 day, 3:39:58
epoch [29/50] batch [540/2000] time 2.185 (2.288) data 0.000 (0.003) loss 2.1636 (1.1712) lr 1.1253e-03 eta 1 day, 3:37:27
epoch [29/50] batch [560/2000] time 2.737 (2.288) data 0.000 (0.003) loss 0.6672 (1.1846) lr 1.1253e-03 eta 1 day, 3:36:36
epoch [29/50] batch [580/2000] time 2.083 (2.285) data 0.000 (0.003) loss 1.4490 (1.1887) lr 1.1253e-03 eta 1 day, 3:33:48
epoch [29/50] batch [600/2000] time 2.049 (2.283) data 0.001 (0.003) loss 1.2851 (1.1920) lr 1.1253e-03 eta 1 day, 3:31:17
epoch [29/50] batch [620/2000] time 2.071 (2.275) data 0.000 (0.003) loss 2.0828 (1.1989) lr 1.1253e-03 eta 1 day, 3:25:09
epoch [29/50] batch [640/2000] time 2.006 (2.268) data 0.000 (0.002) loss 1.6815 (1.2033) lr 1.1253e-03 eta 1 day, 3:19:12
epoch [29/50] batch [660/2000] time 2.063 (2.261) data 0.000 (0.002) loss 1.1552 (1.2032) lr 1.1253e-03 eta 1 day, 3:13:22
epoch [29/50] batch [680/2000] time 1.985 (2.255) data 0.000 (0.002) loss 1.1995 (1.2094) lr 1.1253e-03 eta 1 day, 3:07:56
epoch [29/50] batch [700/2000] time 2.011 (2.249) data 0.005 (0.002) loss 0.0108 (1.2093) lr 1.1253e-03 eta 1 day, 3:02:46
epoch [29/50] batch [720/2000] time 2.066 (2.243) data 0.000 (0.002) loss 6.5816 (1.2103) lr 1.1253e-03 eta 1 day, 2:58:06
epoch [29/50] batch [740/2000] time 2.062 (2.238) data 0.000 (0.002) loss 1.8725 (1.2101) lr 1.1253e-03 eta 1 day, 2:53:28
epoch [29/50] batch [760/2000] time 2.014 (2.232) data 0.000 (0.002) loss 1.3167 (1.2068) lr 1.1253e-03 eta 1 day, 2:48:48
epoch [29/50] batch [780/2000] time 1.985 (2.227) data 0.000 (0.002) loss 0.4431 (1.2003) lr 1.1253e-03 eta 1 day, 2:44:23
epoch [29/50] batch [800/2000] time 2.087 (2.222) data 0.000 (0.002) loss 3.0396 (1.1927) lr 1.1253e-03 eta 1 day, 2:40:10
epoch [29/50] batch [820/2000] time 2.039 (2.218) data 0.000 (0.002) loss 1.5119 (1.1947) lr 1.1253e-03 eta 1 day, 2:36:26
epoch [29/50] batch [840/2000] time 2.041 (2.214) data 0.000 (0.002) loss 2.1185 (1.2022) lr 1.1253e-03 eta 1 day, 2:32:44
epoch [29/50] batch [860/2000] time 2.063 (2.210) data 0.000 (0.002) loss 1.4348 (1.2065) lr 1.1253e-03 eta 1 day, 2:29:11
epoch [29/50] batch [880/2000] time 2.077 (2.207) data 0.000 (0.002) loss 0.6784 (1.2020) lr 1.1253e-03 eta 1 day, 2:25:45
epoch [29/50] batch [900/2000] time 1.982 (2.203) data 0.000 (0.002) loss 0.6079 (1.1969) lr 1.1253e-03 eta 1 day, 2:22:33
epoch [29/50] batch [920/2000] time 2.073 (2.200) data 0.000 (0.002) loss 1.3612 (1.1941) lr 1.1253e-03 eta 1 day, 2:19:26
epoch [29/50] batch [940/2000] time 2.066 (2.197) data 0.000 (0.002) loss 0.4056 (1.1933) lr 1.1253e-03 eta 1 day, 2:16:29
epoch [29/50] batch [960/2000] time 2.010 (2.194) data 0.000 (0.002) loss 0.0821 (1.1911) lr 1.1253e-03 eta 1 day, 2:13:29
epoch [29/50] batch [980/2000] time 2.010 (2.190) data 0.000 (0.002) loss 0.1380 (1.1916) lr 1.1253e-03 eta 1 day, 2:10:30
epoch [29/50] batch [1000/2000] time 2.010 (2.187) data 0.000 (0.002) loss 0.6303 (1.1905) lr 1.1253e-03 eta 1 day, 2:07:41
epoch [29/50] batch [1020/2000] time 2.011 (2.185) data 0.000 (0.002) loss 0.1961 (1.1904) lr 1.1253e-03 eta 1 day, 2:04:53
epoch [29/50] batch [1040/2000] time 2.067 (2.182) data 0.000 (0.002) loss 1.7013 (1.1934) lr 1.1253e-03 eta 1 day, 2:02:11
epoch [29/50] batch [1060/2000] time 2.007 (2.179) data 0.000 (0.002) loss 1.5911 (1.1992) lr 1.1253e-03 eta 1 day, 1:59:33
epoch [29/50] batch [1080/2000] time 2.007 (2.177) data 0.000 (0.002) loss 0.8905 (1.1937) lr 1.1253e-03 eta 1 day, 1:56:57
epoch [29/50] batch [1100/2000] time 2.069 (2.174) data 0.000 (0.002) loss 3.0103 (1.1923) lr 1.1253e-03 eta 1 day, 1:54:29
epoch [29/50] batch [1120/2000] time 2.066 (2.172) data 0.000 (0.002) loss 0.2952 (1.1967) lr 1.1253e-03 eta 1 day, 1:52:03
epoch [29/50] batch [1140/2000] time 2.043 (2.170) data 0.000 (0.002) loss 0.3131 (1.1894) lr 1.1253e-03 eta 1 day, 1:49:47
epoch [29/50] batch [1160/2000] time 2.064 (2.167) data 0.000 (0.002) loss 1.0797 (1.1912) lr 1.1253e-03 eta 1 day, 1:47:25
epoch [29/50] batch [1180/2000] time 2.069 (2.165) data 0.003 (0.002) loss 1.3697 (1.1868) lr 1.1253e-03 eta 1 day, 1:45:16
epoch [29/50] batch [1200/2000] time 1.991 (2.163) data 0.000 (0.002) loss 0.6367 (1.1828) lr 1.1253e-03 eta 1 day, 1:43:03
epoch [29/50] batch [1220/2000] time 2.009 (2.161) data 0.000 (0.002) loss 2.0449 (1.1824) lr 1.1253e-03 eta 1 day, 1:40:59
epoch [29/50] batch [1240/2000] time 2.063 (2.159) data 0.000 (0.002) loss 1.2433 (1.1937) lr 1.1253e-03 eta 1 day, 1:38:54
epoch [29/50] batch [1260/2000] time 2.008 (2.158) data 0.000 (0.001) loss 2.2716 (1.1955) lr 1.1253e-03 eta 1 day, 1:36:55
epoch [29/50] batch [1280/2000] time 2.064 (2.156) data 0.000 (0.001) loss 0.0467 (1.1937) lr 1.1253e-03 eta 1 day, 1:34:58
epoch [29/50] batch [1300/2000] time 2.009 (2.154) data 0.000 (0.001) loss 1.7033 (1.1868) lr 1.1253e-03 eta 1 day, 1:32:56
epoch [29/50] batch [1320/2000] time 2.069 (2.152) data 0.000 (0.001) loss 0.7919 (1.1851) lr 1.1253e-03 eta 1 day, 1:31:02
epoch [29/50] batch [1340/2000] time 2.065 (2.151) data 0.000 (0.001) loss 0.6898 (1.1790) lr 1.1253e-03 eta 1 day, 1:29:15
epoch [29/50] batch [1360/2000] time 2.008 (2.149) data 0.000 (0.001) loss 1.7273 (1.1822) lr 1.1253e-03 eta 1 day, 1:27:27
epoch [29/50] batch [1380/2000] time 2.042 (2.148) data 0.000 (0.001) loss 0.3747 (1.1817) lr 1.1253e-03 eta 1 day, 1:25:36
epoch [29/50] batch [1400/2000] time 2.072 (2.146) data 0.000 (0.001) loss 1.2222 (1.1797) lr 1.1253e-03 eta 1 day, 1:23:49
epoch [29/50] batch [1420/2000] time 2.070 (2.145) data 0.000 (0.001) loss 1.4908 (1.1823) lr 1.1253e-03 eta 1 day, 1:22:05
epoch [29/50] batch [1440/2000] time 2.064 (2.143) data 0.000 (0.001) loss 0.4703 (1.1811) lr 1.1253e-03 eta 1 day, 1:20:25
epoch [29/50] batch [1460/2000] time 2.069 (2.142) data 0.000 (0.001) loss 0.4375 (1.1845) lr 1.1253e-03 eta 1 day, 1:18:43
epoch [29/50] batch [1480/2000] time 2.008 (2.141) data 0.000 (0.001) loss 2.2293 (1.1790) lr 1.1253e-03 eta 1 day, 1:17:06
epoch [29/50] batch [1500/2000] time 2.015 (2.140) data 0.000 (0.001) loss 2.3163 (1.1825) lr 1.1253e-03 eta 1 day, 1:15:28
epoch [29/50] batch [1520/2000] time 2.043 (2.138) data 0.000 (0.001) loss 3.2585 (1.1836) lr 1.1253e-03 eta 1 day, 1:13:59
epoch [29/50] batch [1540/2000] time 2.010 (2.137) data 0.000 (0.001) loss 1.2558 (1.1837) lr 1.1253e-03 eta 1 day, 1:12:28
epoch [29/50] batch [1560/2000] time 2.045 (2.136) data 0.000 (0.001) loss 0.6319 (1.1816) lr 1.1253e-03 eta 1 day, 1:11:00
epoch [29/50] batch [1580/2000] time 2.056 (2.135) data 0.000 (0.001) loss 1.1147 (1.1771) lr 1.1253e-03 eta 1 day, 1:09:28
epoch [29/50] batch [1600/2000] time 2.068 (2.134) data 0.000 (0.001) loss 0.3221 (1.1761) lr 1.1253e-03 eta 1 day, 1:08:02
epoch [29/50] batch [1620/2000] time 2.064 (2.133) data 0.000 (0.001) loss 0.0459 (1.1802) lr 1.1253e-03 eta 1 day, 1:06:32
epoch [29/50] batch [1640/2000] time 2.068 (2.132) data 0.000 (0.001) loss 1.7267 (1.1758) lr 1.1253e-03 eta 1 day, 1:05:01
epoch [29/50] batch [1660/2000] time 2.009 (2.131) data 0.000 (0.001) loss 0.8380 (1.1741) lr 1.1253e-03 eta 1 day, 1:03:35
epoch [29/50] batch [1680/2000] time 2.019 (2.130) data 0.001 (0.001) loss 0.4386 (1.1741) lr 1.1253e-03 eta 1 day, 1:02:11
epoch [29/50] batch [1700/2000] time 2.069 (2.129) data 0.000 (0.001) loss 0.7479 (1.1747) lr 1.1253e-03 eta 1 day, 1:00:46
epoch [29/50] batch [1720/2000] time 2.051 (2.128) data 0.000 (0.001) loss 0.7139 (1.1742) lr 1.1253e-03 eta 1 day, 0:59:26
epoch [29/50] batch [1740/2000] time 2.014 (2.127) data 0.000 (0.001) loss 1.1993 (1.1741) lr 1.1253e-03 eta 1 day, 0:58:00
epoch [29/50] batch [1760/2000] time 2.047 (2.126) data 0.000 (0.001) loss 0.8451 (1.1744) lr 1.1253e-03 eta 1 day, 0:56:40
epoch [29/50] batch [1780/2000] time 2.056 (2.125) data 0.001 (0.001) loss 0.3771 (1.1765) lr 1.1253e-03 eta 1 day, 0:55:21
epoch [29/50] batch [1800/2000] time 2.066 (2.124) data 0.000 (0.001) loss 1.3268 (1.1767) lr 1.1253e-03 eta 1 day, 0:54:02
epoch [29/50] batch [1820/2000] time 2.007 (2.123) data 0.000 (0.001) loss 0.7836 (1.1770) lr 1.1253e-03 eta 1 day, 0:52:43
epoch [29/50] batch [1840/2000] time 2.042 (2.122) data 0.000 (0.001) loss 0.6892 (1.1763) lr 1.1253e-03 eta 1 day, 0:51:23
epoch [29/50] batch [1860/2000] time 2.008 (2.122) data 0.000 (0.001) loss 0.5122 (1.1743) lr 1.1253e-03 eta 1 day, 0:50:03
epoch [29/50] batch [1880/2000] time 2.012 (2.121) data 0.000 (0.001) loss 1.2785 (1.1718) lr 1.1253e-03 eta 1 day, 0:48:48
epoch [29/50] batch [1900/2000] time 2.072 (2.120) data 0.000 (0.001) loss 1.9765 (1.1734) lr 1.1253e-03 eta 1 day, 0:47:32
epoch [29/50] batch [1920/2000] time 2.047 (2.119) data 0.000 (0.001) loss 0.3283 (1.1723) lr 1.1253e-03 eta 1 day, 0:46:15
epoch [29/50] batch [1940/2000] time 2.065 (2.118) data 0.000 (0.001) loss 0.7803 (1.1712) lr 1.1253e-03 eta 1 day, 0:44:59
epoch [29/50] batch [1960/2000] time 2.062 (2.118) data 0.000 (0.001) loss 1.6992 (1.1711) lr 1.1253e-03 eta 1 day, 0:43:43
epoch [29/50] batch [1980/2000] time 2.064 (2.117) data 0.000 (0.001) loss 1.0010 (1.1699) lr 1.1253e-03 eta 1 day, 0:42:30
epoch [29/50] batch [2000/2000] time 2.011 (2.116) data 0.000 (0.001) loss 2.6844 (1.1699) lr 1.0628e-03 eta 1 day, 0:41:13
epoch [30/50] batch [20/2000] time 2.050 (2.081) data 0.000 (0.036) loss 2.1638 (1.3951) lr 1.0628e-03 eta 1 day, 0:15:56
epoch [30/50] batch [40/2000] time 1.990 (2.062) data 0.000 (0.018) loss 0.5981 (1.2599) lr 1.0628e-03 eta 1 day, 0:01:49
epoch [30/50] batch [60/2000] time 2.048 (2.056) data 0.001 (0.012) loss 1.5450 (1.2346) lr 1.0628e-03 eta 23:57:26
epoch [30/50] batch [80/2000] time 2.066 (2.055) data 0.000 (0.009) loss 0.9713 (1.1548) lr 1.0628e-03 eta 23:55:47
epoch [30/50] batch [100/2000] time 2.010 (2.054) data 0.000 (0.007) loss 2.2208 (1.2341) lr 1.0628e-03 eta 23:54:39
epoch [30/50] batch [120/2000] time 2.081 (2.054) data 0.000 (0.006) loss 1.5590 (1.2369) lr 1.0628e-03 eta 23:53:29
epoch [30/50] batch [140/2000] time 2.069 (2.053) data 0.000 (0.005) loss 0.3383 (1.2086) lr 1.0628e-03 eta 23:52:31
epoch [30/50] batch [160/2000] time 2.049 (2.053) data 0.000 (0.005) loss 0.0552 (1.2185) lr 1.0628e-03 eta 23:51:28
epoch [30/50] batch [180/2000] time 2.028 (2.053) data 0.006 (0.004) loss 3.2059 (1.2636) lr 1.0628e-03 eta 23:50:57
epoch [30/50] batch [200/2000] time 2.061 (2.054) data 0.000 (0.004) loss 0.5369 (1.2354) lr 1.0628e-03 eta 23:50:49
epoch [30/50] batch [220/2000] time 1.989 (2.054) data 0.000 (0.004) loss 1.0423 (1.2160) lr 1.0628e-03 eta 23:50:32
epoch [30/50] batch [240/2000] time 2.006 (2.053) data 0.000 (0.003) loss 2.4026 (1.2093) lr 1.0628e-03 eta 23:49:10
epoch [30/50] batch [260/2000] time 2.034 (2.053) data 0.000 (0.003) loss 1.4929 (1.1871) lr 1.0628e-03 eta 23:48:04
epoch [30/50] batch [280/2000] time 2.058 (2.052) data 0.000 (0.003) loss 2.0503 (1.2123) lr 1.0628e-03 eta 23:46:44
epoch [30/50] batch [300/2000] time 2.059 (2.051) data 0.000 (0.003) loss 0.5773 (1.2166) lr 1.0628e-03 eta 23:45:26
epoch [30/50] batch [320/2000] time 2.006 (2.050) data 0.000 (0.003) loss 2.5990 (1.2085) lr 1.0628e-03 eta 23:44:02
epoch [30/50] batch [340/2000] time 2.007 (2.049) data 0.000 (0.003) loss 0.0678 (1.2109) lr 1.0628e-03 eta 23:42:52
epoch [30/50] batch [360/2000] time 2.007 (2.049) data 0.000 (0.002) loss 1.7994 (1.2056) lr 1.0628e-03 eta 23:41:40
epoch [30/50] batch [380/2000] time 2.010 (2.048) data 0.000 (0.002) loss 5.1204 (1.2264) lr 1.0628e-03 eta 23:40:35
epoch [30/50] batch [400/2000] time 2.062 (2.047) data 0.000 (0.002) loss 1.4737 (1.2138) lr 1.0628e-03 eta 23:39:22
epoch [30/50] batch [420/2000] time 2.035 (2.047) data 0.000 (0.002) loss 0.3555 (1.2057) lr 1.0628e-03 eta 23:38:25
epoch [30/50] batch [440/2000] time 2.058 (2.046) data 0.000 (0.002) loss 1.0417 (1.2001) lr 1.0628e-03 eta 23:37:22
epoch [30/50] batch [460/2000] time 2.036 (2.046) data 0.000 (0.002) loss 0.4077 (1.1969) lr 1.0628e-03 eta 23:36:13
epoch [30/50] batch [480/2000] time 2.068 (2.045) data 0.000 (0.002) loss 0.1844 (1.2151) lr 1.0628e-03 eta 23:35:26
epoch [30/50] batch [500/2000] time 2.065 (2.045) data 0.001 (0.002) loss 0.8389 (1.2191) lr 1.0628e-03 eta 23:34:34
epoch [30/50] batch [520/2000] time 2.058 (2.045) data 0.000 (0.002) loss 0.1680 (1.2134) lr 1.0628e-03 eta 23:33:48
epoch [30/50] batch [540/2000] time 2.061 (2.045) data 0.000 (0.002) loss 1.8072 (1.2110) lr 1.0628e-03 eta 23:32:52
epoch [30/50] batch [560/2000] time 2.007 (2.044) data 0.000 (0.002) loss 2.9889 (1.2093) lr 1.0628e-03 eta 23:32:00
epoch [30/50] batch [580/2000] time 2.044 (2.044) data 0.000 (0.002) loss 0.2301 (1.2191) lr 1.0628e-03 eta 23:31:14
epoch [30/50] batch [600/2000] time 2.044 (2.044) data 0.000 (0.002) loss 0.6730 (1.2151) lr 1.0628e-03 eta 23:30:33
epoch [30/50] batch [620/2000] time 2.063 (2.044) data 0.000 (0.002) loss 0.4642 (1.2133) lr 1.0628e-03 eta 23:29:42
epoch [30/50] batch [640/2000] time 2.051 (2.044) data 0.000 (0.001) loss 1.5980 (1.2096) lr 1.0628e-03 eta 23:29:04
epoch [30/50] batch [660/2000] time 2.045 (2.045) data 0.000 (0.001) loss 1.8215 (1.2072) lr 1.0628e-03 eta 23:28:41
epoch [30/50] batch [680/2000] time 2.047 (2.045) data 0.000 (0.001) loss 1.1087 (1.2097) lr 1.0628e-03 eta 23:28:14
epoch [30/50] batch [700/2000] time 2.063 (2.045) data 0.000 (0.001) loss 1.3947 (1.2011) lr 1.0628e-03 eta 23:27:27
epoch [30/50] batch [720/2000] time 2.023 (2.045) data 0.000 (0.001) loss 0.4243 (1.1979) lr 1.0628e-03 eta 23:26:43
epoch [30/50] batch [740/2000] time 2.134 (2.045) data 0.000 (0.001) loss 2.3132 (1.1945) lr 1.0628e-03 eta 23:26:18
epoch [30/50] batch [760/2000] time 2.058 (2.045) data 0.000 (0.001) loss 0.0312 (1.1981) lr 1.0628e-03 eta 23:25:24
epoch [30/50] batch [780/2000] time 2.033 (2.044) data 0.000 (0.001) loss 1.9032 (1.1973) lr 1.0628e-03 eta 23:24:29
epoch [30/50] batch [800/2000] time 1.990 (2.045) data 0.000 (0.001) loss 0.7808 (1.1977) lr 1.0628e-03 eta 23:23:55
epoch [30/50] batch [820/2000] time 2.019 (2.044) data 0.000 (0.001) loss 1.1717 (1.1952) lr 1.0628e-03 eta 23:23:09
epoch [30/50] batch [840/2000] time 2.057 (2.044) data 0.000 (0.001) loss 0.1240 (1.1989) lr 1.0628e-03 eta 23:22:25
epoch [30/50] batch [860/2000] time 2.008 (2.044) data 0.000 (0.001) loss 0.3539 (1.1924) lr 1.0628e-03 eta 23:21:40
epoch [30/50] batch [880/2000] time 2.064 (2.044) data 0.000 (0.001) loss 1.2904 (1.1993) lr 1.0628e-03 eta 23:21:01
epoch [30/50] batch [900/2000] time 1.980 (2.044) data 0.000 (0.001) loss 0.8366 (1.2013) lr 1.0628e-03 eta 23:20:18
epoch [30/50] batch [920/2000] time 1.980 (2.044) data 0.000 (0.001) loss 1.3778 (1.2018) lr 1.0628e-03 eta 23:19:36
epoch [30/50] batch [940/2000] time 2.063 (2.044) data 0.000 (0.001) loss 2.3358 (1.2042) lr 1.0628e-03 eta 23:18:54
epoch [30/50] batch [960/2000] time 2.065 (2.045) data 0.000 (0.001) loss 0.0431 (1.2051) lr 1.0628e-03 eta 23:18:28
epoch [30/50] batch [980/2000] time 2.006 (2.045) data 0.000 (0.001) loss 1.0109 (1.2047) lr 1.0628e-03 eta 23:17:46
epoch [30/50] batch [1000/2000] time 2.065 (2.045) data 0.000 (0.001) loss 0.1985 (1.2084) lr 1.0628e-03 eta 23:17:06
epoch [30/50] batch [1020/2000] time 2.072 (2.045) data 0.000 (0.001) loss 1.7200 (1.2144) lr 1.0628e-03 eta 23:16:29
epoch [30/50] batch [1040/2000] time 2.050 (2.045) data 0.005 (0.001) loss 0.2816 (1.2168) lr 1.0628e-03 eta 23:15:50
epoch [30/50] batch [1060/2000] time 2.039 (2.045) data 0.000 (0.001) loss 1.0508 (1.2180) lr 1.0628e-03 eta 23:15:15
epoch [30/50] batch [1080/2000] time 2.065 (2.045) data 0.000 (0.001) loss 1.7264 (1.2220) lr 1.0628e-03 eta 23:14:33
epoch [30/50] batch [1100/2000] time 2.011 (2.045) data 0.000 (0.001) loss 1.5247 (1.2199) lr 1.0628e-03 eta 23:13:58
epoch [30/50] batch [1120/2000] time 2.070 (2.045) data 0.000 (0.001) loss 1.0514 (1.2199) lr 1.0628e-03 eta 23:13:19
epoch [30/50] batch [1140/2000] time 2.068 (2.045) data 0.001 (0.001) loss 0.4472 (1.2178) lr 1.0628e-03 eta 23:12:40
epoch [30/50] batch [1160/2000] time 2.064 (2.045) data 0.000 (0.001) loss 1.4194 (1.2153) lr 1.0628e-03 eta 23:11:57
epoch [30/50] batch [1180/2000] time 2.006 (2.045) data 0.000 (0.001) loss 0.8698 (1.2155) lr 1.0628e-03 eta 23:11:10
epoch [30/50] batch [1200/2000] time 1.983 (2.045) data 0.000 (0.001) loss 0.8167 (1.2123) lr 1.0628e-03 eta 23:10:29
epoch [30/50] batch [1220/2000] time 2.112 (2.045) data 0.000 (0.001) loss 0.3873 (1.2084) lr 1.0628e-03 eta 23:09:45
epoch [30/50] batch [1240/2000] time 2.018 (2.045) data 0.000 (0.001) loss 0.4922 (1.2051) lr 1.0628e-03 eta 23:09:06
epoch [30/50] batch [1260/2000] time 2.039 (2.045) data 0.000 (0.001) loss 1.7965 (1.2030) lr 1.0628e-03 eta 23:08:28
epoch [30/50] batch [1280/2000] time 2.067 (2.045) data 0.000 (0.001) loss 0.6695 (1.2036) lr 1.0628e-03 eta 23:07:42
epoch [30/50] batch [1300/2000] time 2.006 (2.045) data 0.000 (0.001) loss 0.4621 (1.2060) lr 1.0628e-03 eta 23:06:59
epoch [30/50] batch [1320/2000] time 2.061 (2.044) data 0.000 (0.001) loss 1.9339 (1.2048) lr 1.0628e-03 eta 23:06:09
epoch [30/50] batch [1340/2000] time 2.057 (2.044) data 0.000 (0.001) loss 0.9054 (1.2050) lr 1.0628e-03 eta 23:05:24
epoch [30/50] batch [1360/2000] time 2.062 (2.044) data 0.000 (0.001) loss 0.2054 (1.1989) lr 1.0628e-03 eta 23:04:35
epoch [30/50] batch [1380/2000] time 2.006 (2.044) data 0.000 (0.001) loss 0.9525 (1.1965) lr 1.0628e-03 eta 23:03:50
epoch [30/50] batch [1400/2000] time 2.039 (2.044) data 0.000 (0.001) loss 0.7057 (1.1947) lr 1.0628e-03 eta 23:03:10
epoch [30/50] batch [1420/2000] time 2.064 (2.044) data 0.000 (0.001) loss 1.2628 (1.1926) lr 1.0628e-03 eta 23:02:24
epoch [30/50] batch [1440/2000] time 2.064 (2.044) data 0.000 (0.001) loss 1.4137 (1.1914) lr 1.0628e-03 eta 23:01:41
epoch [30/50] batch [1460/2000] time 2.042 (2.044) data 0.000 (0.001) loss 0.4049 (1.1909) lr 1.0628e-03 eta 23:00:58
epoch [30/50] batch [1480/2000] time 2.074 (2.044) data 0.000 (0.001) loss 1.8216 (1.1977) lr 1.0628e-03 eta 23:00:18
epoch [30/50] batch [1500/2000] time 2.039 (2.044) data 0.000 (0.001) loss 1.1984 (1.1961) lr 1.0628e-03 eta 22:59:33
epoch [30/50] batch [1520/2000] time 2.070 (2.044) data 0.000 (0.001) loss 0.5651 (1.1984) lr 1.0628e-03 eta 22:58:51
epoch [30/50] batch [1540/2000] time 2.039 (2.044) data 0.000 (0.001) loss 3.3839 (1.1976) lr 1.0628e-03 eta 22:58:09
epoch [30/50] batch [1560/2000] time 2.064 (2.044) data 0.000 (0.001) loss 0.1101 (1.1952) lr 1.0628e-03 eta 22:57:27
epoch [30/50] batch [1580/2000] time 2.068 (2.044) data 0.000 (0.001) loss 0.5254 (1.1913) lr 1.0628e-03 eta 22:56:46
epoch [30/50] batch [1600/2000] time 2.060 (2.044) data 0.000 (0.001) loss 0.4136 (1.1905) lr 1.0628e-03 eta 22:56:01
epoch [30/50] batch [1620/2000] time 2.042 (2.044) data 0.000 (0.001) loss 0.5036 (1.1875) lr 1.0628e-03 eta 22:55:19
epoch [30/50] batch [1640/2000] time 2.064 (2.044) data 0.000 (0.001) loss 0.2224 (1.1879) lr 1.0628e-03 eta 22:54:38
epoch [30/50] batch [1660/2000] time 2.075 (2.044) data 0.000 (0.001) loss 0.5195 (1.1849) lr 1.0628e-03 eta 22:53:59
epoch [30/50] batch [1680/2000] time 2.066 (2.044) data 0.001 (0.001) loss 2.4429 (1.1838) lr 1.0628e-03 eta 22:53:22
epoch [30/50] batch [1700/2000] time 2.041 (2.044) data 0.000 (0.001) loss 2.3948 (1.1876) lr 1.0628e-03 eta 22:52:40
epoch [30/50] batch [1720/2000] time 2.041 (2.044) data 0.000 (0.001) loss 0.1299 (1.1859) lr 1.0628e-03 eta 22:51:58
epoch [30/50] batch [1740/2000] time 2.064 (2.044) data 0.000 (0.001) loss 1.8130 (1.1899) lr 1.0628e-03 eta 22:51:18
epoch [30/50] batch [1760/2000] time 2.015 (2.044) data 0.000 (0.001) loss 0.8834 (1.1923) lr 1.0628e-03 eta 22:50:36
epoch [30/50] batch [1780/2000] time 2.035 (2.044) data 0.000 (0.001) loss 3.6074 (1.1941) lr 1.0628e-03 eta 22:49:51
epoch [30/50] batch [1800/2000] time 2.007 (2.044) data 0.000 (0.001) loss 0.1624 (1.1916) lr 1.0628e-03 eta 22:49:09
epoch [30/50] batch [1820/2000] time 2.064 (2.043) data 0.000 (0.001) loss 0.1651 (1.1948) lr 1.0628e-03 eta 22:48:26
epoch [30/50] batch [1840/2000] time 2.035 (2.043) data 0.000 (0.001) loss 0.8835 (1.1947) lr 1.0628e-03 eta 22:47:41
epoch [30/50] batch [1860/2000] time 2.005 (2.043) data 0.000 (0.001) loss 0.3739 (1.1937) lr 1.0628e-03 eta 22:46:56
epoch [30/50] batch [1880/2000] time 2.058 (2.043) data 0.000 (0.001) loss 1.0529 (1.1935) lr 1.0628e-03 eta 22:46:15
epoch [30/50] batch [1900/2000] time 2.064 (2.043) data 0.000 (0.001) loss 1.7149 (1.1956) lr 1.0628e-03 eta 22:45:32
epoch [30/50] batch [1920/2000] time 2.010 (2.043) data 0.000 (0.001) loss 0.1902 (1.1933) lr 1.0628e-03 eta 22:44:50
epoch [30/50] batch [1940/2000] time 2.066 (2.043) data 0.000 (0.001) loss 0.1357 (1.1985) lr 1.0628e-03 eta 22:44:11
epoch [30/50] batch [1960/2000] time 2.011 (2.043) data 0.000 (0.001) loss 1.2326 (1.1994) lr 1.0628e-03 eta 22:43:31
epoch [30/50] batch [1980/2000] time 2.012 (2.043) data 0.000 (0.001) loss 0.4445 (1.1978) lr 1.0628e-03 eta 22:42:48
epoch [30/50] batch [2000/2000] time 2.058 (2.043) data 0.000 (0.001) loss 3.3122 (1.2007) lr 1.0000e-03 eta 22:42:04
epoch [31/50] batch [20/2000] time 2.061 (2.074) data 0.000 (0.029) loss 1.7902 (1.3026) lr 1.0000e-03 eta 23:01:51
epoch [31/50] batch [40/2000] time 2.071 (2.057) data 0.000 (0.015) loss 1.9402 (1.4085) lr 1.0000e-03 eta 22:49:38
epoch [31/50] batch [60/2000] time 2.071 (2.053) data 0.001 (0.010) loss 2.1292 (1.2573) lr 1.0000e-03 eta 22:46:47
epoch [31/50] batch [80/2000] time 2.068 (2.052) data 0.000 (0.007) loss 1.5429 (1.2583) lr 1.0000e-03 eta 22:45:11
epoch [31/50] batch [100/2000] time 2.071 (2.052) data 0.000 (0.006) loss 1.3410 (1.2415) lr 1.0000e-03 eta 22:44:46
epoch [31/50] batch [120/2000] time 2.068 (2.052) data 0.000 (0.005) loss 2.0536 (1.2374) lr 1.0000e-03 eta 22:43:35
epoch [31/50] batch [140/2000] time 2.069 (2.051) data 0.000 (0.004) loss 1.6032 (1.2192) lr 1.0000e-03 eta 22:42:37
epoch [31/50] batch [160/2000] time 2.069 (2.051) data 0.000 (0.004) loss 1.0440 (1.1699) lr 1.0000e-03 eta 22:41:41
epoch [31/50] batch [180/2000] time 2.067 (2.050) data 0.000 (0.004) loss 1.1697 (1.1588) lr 1.0000e-03 eta 22:40:22
epoch [31/50] batch [200/2000] time 2.012 (2.049) data 0.000 (0.003) loss 2.0016 (1.1731) lr 1.0000e-03 eta 22:39:10
epoch [31/50] batch [220/2000] time 2.067 (2.049) data 0.000 (0.003) loss 0.7607 (1.1686) lr 1.0000e-03 eta 22:38:20
epoch [31/50] batch [240/2000] time 2.043 (2.049) data 0.000 (0.003) loss 1.9308 (1.2169) lr 1.0000e-03 eta 22:37:37
epoch [31/50] batch [260/2000] time 2.047 (2.049) data 0.000 (0.003) loss 1.4319 (1.2355) lr 1.0000e-03 eta 22:36:55
epoch [31/50] batch [280/2000] time 2.049 (2.049) data 0.000 (0.002) loss 0.3424 (1.2589) lr 1.0000e-03 eta 22:36:37
epoch [31/50] batch [300/2000] time 2.048 (2.049) data 0.000 (0.002) loss 0.5367 (1.2406) lr 1.0000e-03 eta 22:35:58
epoch [31/50] batch [320/2000] time 2.068 (2.049) data 0.000 (0.002) loss 0.4241 (1.2380) lr 1.0000e-03 eta 22:35:16
epoch [31/50] batch [340/2000] time 2.068 (2.049) data 0.000 (0.002) loss 0.9227 (1.2429) lr 1.0000e-03 eta 22:34:38
epoch [31/50] batch [360/2000] time 2.044 (2.049) data 0.000 (0.002) loss 0.2016 (1.2280) lr 1.0000e-03 eta 22:33:52
epoch [31/50] batch [380/2000] time 2.012 (2.049) data 0.000 (0.002) loss 1.5028 (1.2112) lr 1.0000e-03 eta 22:33:06
epoch [31/50] batch [400/2000] time 2.046 (2.049) data 0.000 (0.002) loss 0.3941 (1.1998) lr 1.0000e-03 eta 22:32:20
epoch [31/50] batch [420/2000] time 2.065 (2.049) data 0.000 (0.002) loss 1.8819 (1.2166) lr 1.0000e-03 eta 22:31:33
epoch [31/50] batch [440/2000] time 2.044 (2.049) data 0.000 (0.002) loss 3.1845 (1.2058) lr 1.0000e-03 eta 22:30:47
epoch [31/50] batch [460/2000] time 2.041 (2.049) data 0.000 (0.002) loss 0.2366 (1.1888) lr 1.0000e-03 eta 22:30:10
epoch [31/50] batch [480/2000] time 2.069 (2.049) data 0.000 (0.002) loss 0.8873 (1.1897) lr 1.0000e-03 eta 22:29:24
epoch [31/50] batch [500/2000] time 2.017 (2.049) data 0.001 (0.002) loss 0.6881 (1.1847) lr 1.0000e-03 eta 22:28:42
epoch [31/50] batch [520/2000] time 2.076 (2.049) data 0.000 (0.002) loss 0.7650 (1.1927) lr 1.0000e-03 eta 22:28:10
epoch [31/50] batch [540/2000] time 2.050 (2.050) data 0.000 (0.001) loss 0.0453 (1.1943) lr 1.0000e-03 eta 22:28:19
epoch [31/50] batch [560/2000] time 2.070 (2.050) data 0.000 (0.001) loss 0.4701 (1.1934) lr 1.0000e-03 eta 22:27:49
epoch [31/50] batch [580/2000] time 2.010 (2.050) data 0.000 (0.001) loss 0.7658 (1.1951) lr 1.0000e-03 eta 22:26:57
epoch [31/50] batch [600/2000] time 2.047 (2.050) data 0.001 (0.001) loss 0.5927 (1.1832) lr 1.0000e-03 eta 22:26:12
epoch [31/50] batch [620/2000] time 2.074 (2.050) data 0.000 (0.001) loss 0.9832 (1.1798) lr 1.0000e-03 eta 22:25:24
epoch [31/50] batch [640/2000] time 2.160 (2.050) data 0.000 (0.001) loss 0.0623 (1.1725) lr 1.0000e-03 eta 22:24:55
epoch [31/50] batch [660/2000] time 2.015 (2.050) data 0.000 (0.001) loss 0.6323 (1.1693) lr 1.0000e-03 eta 22:24:26
epoch [31/50] batch [680/2000] time 2.009 (2.050) data 0.000 (0.001) loss 0.1997 (1.1628) lr 1.0000e-03 eta 22:23:32
epoch [31/50] batch [700/2000] time 2.047 (2.050) data 0.000 (0.001) loss 0.7765 (1.1722) lr 1.0000e-03 eta 22:22:55
epoch [31/50] batch [720/2000] time 2.068 (2.050) data 0.000 (0.001) loss 0.6484 (1.1652) lr 1.0000e-03 eta 22:22:06
epoch [31/50] batch [740/2000] time 2.008 (2.050) data 0.001 (0.001) loss 0.6422 (1.1608) lr 1.0000e-03 eta 22:21:26
epoch [31/50] batch [760/2000] time 2.070 (2.050) data 0.000 (0.001) loss 1.6789 (1.1680) lr 1.0000e-03 eta 22:20:41
epoch [31/50] batch [780/2000] time 2.067 (2.050) data 0.000 (0.001) loss 0.9390 (1.1692) lr 1.0000e-03 eta 22:19:58
epoch [31/50] batch [800/2000] time 2.064 (2.049) data 0.000 (0.001) loss 0.5880 (1.1630) lr 1.0000e-03 eta 22:19:00
epoch [31/50] batch [820/2000] time 2.068 (2.049) data 0.000 (0.001) loss 1.2669 (1.1662) lr 1.0000e-03 eta 22:18:17
epoch [31/50] batch [840/2000] time 2.066 (2.049) data 0.000 (0.001) loss 2.2175 (1.1659) lr 1.0000e-03 eta 22:17:25
epoch [31/50] batch [860/2000] time 2.012 (2.049) data 0.000 (0.001) loss 0.3791 (1.1656) lr 1.0000e-03 eta 22:16:42
epoch [31/50] batch [880/2000] time 2.080 (2.049) data 0.000 (0.001) loss 0.6538 (1.1642) lr 1.0000e-03 eta 22:15:55
epoch [31/50] batch [900/2000] time 2.023 (2.049) data 0.000 (0.001) loss 0.4882 (1.1675) lr 1.0000e-03 eta 22:15:11
epoch [31/50] batch [920/2000] time 2.010 (2.049) data 0.000 (0.001) loss 0.4254 (1.1747) lr 1.0000e-03 eta 22:14:27
epoch [31/50] batch [940/2000] time 2.064 (2.049) data 0.000 (0.001) loss 0.5382 (1.1751) lr 1.0000e-03 eta 22:13:48
epoch [31/50] batch [960/2000] time 2.068 (2.049) data 0.000 (0.001) loss 0.2921 (1.1764) lr 1.0000e-03 eta 22:12:58
epoch [31/50] batch [980/2000] time 2.066 (2.048) data 0.000 (0.001) loss 0.5749 (1.1740) lr 1.0000e-03 eta 22:12:10
epoch [31/50] batch [1000/2000] time 2.067 (2.048) data 0.000 (0.001) loss 0.4892 (1.1738) lr 1.0000e-03 eta 22:11:28
epoch [31/50] batch [1020/2000] time 2.065 (2.048) data 0.000 (0.001) loss 0.2938 (1.1762) lr 1.0000e-03 eta 22:10:48
epoch [31/50] batch [1040/2000] time 2.070 (2.048) data 0.000 (0.001) loss 4.6924 (1.1750) lr 1.0000e-03 eta 22:10:00
epoch [31/50] batch [1060/2000] time 2.045 (2.048) data 0.000 (0.001) loss 1.9545 (1.1669) lr 1.0000e-03 eta 22:09:19
epoch [31/50] batch [1080/2000] time 2.041 (2.048) data 0.000 (0.001) loss 0.3109 (1.1656) lr 1.0000e-03 eta 22:08:36
epoch [31/50] batch [1100/2000] time 2.041 (2.048) data 0.000 (0.001) loss 0.6460 (1.1661) lr 1.0000e-03 eta 22:07:47
epoch [31/50] batch [1120/2000] time 2.063 (2.048) data 0.000 (0.001) loss 1.3774 (1.1617) lr 1.0000e-03 eta 22:07:06
epoch [31/50] batch [1140/2000] time 1.986 (2.048) data 0.000 (0.001) loss 0.8432 (1.1606) lr 1.0000e-03 eta 22:06:20
epoch [31/50] batch [1160/2000] time 2.067 (2.048) data 0.000 (0.001) loss 1.1100 (1.1656) lr 1.0000e-03 eta 22:05:34
epoch [31/50] batch [1180/2000] time 2.072 (2.048) data 0.000 (0.001) loss 0.2177 (1.1670) lr 1.0000e-03 eta 22:04:53
epoch [31/50] batch [1200/2000] time 2.006 (2.048) data 0.000 (0.001) loss 2.3639 (1.1685) lr 1.0000e-03 eta 22:04:09
epoch [31/50] batch [1220/2000] time 2.063 (2.048) data 0.000 (0.001) loss 1.3833 (1.1634) lr 1.0000e-03 eta 22:03:23
epoch [31/50] batch [1240/2000] time 2.012 (2.047) data 0.000 (0.001) loss 1.1026 (1.1636) lr 1.0000e-03 eta 22:02:39
epoch [31/50] batch [1260/2000] time 2.067 (2.047) data 0.000 (0.001) loss 1.1258 (1.1599) lr 1.0000e-03 eta 22:01:55
epoch [31/50] batch [1280/2000] time 2.050 (2.047) data 0.005 (0.001) loss 0.9739 (1.1633) lr 1.0000e-03 eta 22:01:11
epoch [31/50] batch [1300/2000] time 2.007 (2.047) data 0.000 (0.001) loss 2.6999 (1.1611) lr 1.0000e-03 eta 22:00:22
epoch [31/50] batch [1320/2000] time 2.048 (2.047) data 0.000 (0.001) loss 1.1807 (1.1581) lr 1.0000e-03 eta 21:59:39
epoch [31/50] batch [1340/2000] time 2.077 (2.047) data 0.000 (0.001) loss 1.6730 (1.1608) lr 1.0000e-03 eta 21:59:01
epoch [31/50] batch [1360/2000] time 2.058 (2.047) data 0.000 (0.001) loss 0.2560 (1.1632) lr 1.0000e-03 eta 21:58:19
epoch [31/50] batch [1380/2000] time 2.065 (2.047) data 0.000 (0.001) loss 1.5202 (1.1664) lr 1.0000e-03 eta 21:57:31
epoch [31/50] batch [1400/2000] time 2.004 (2.047) data 0.000 (0.001) loss 1.6652 (1.1632) lr 1.0000e-03 eta 21:56:43
epoch [31/50] batch [1420/2000] time 2.038 (2.047) data 0.000 (0.001) loss 0.4975 (1.1645) lr 1.0000e-03 eta 21:55:55
epoch [31/50] batch [1440/2000] time 2.007 (2.046) data 0.000 (0.001) loss 0.4679 (1.1627) lr 1.0000e-03 eta 21:55:07
epoch [31/50] batch [1460/2000] time 2.006 (2.046) data 0.000 (0.001) loss 1.2712 (1.1649) lr 1.0000e-03 eta 21:54:17
epoch [31/50] batch [1480/2000] time 2.039 (2.046) data 0.000 (0.001) loss 1.4343 (1.1694) lr 1.0000e-03 eta 21:53:37
epoch [31/50] batch [1500/2000] time 2.062 (2.046) data 0.000 (0.001) loss 1.4514 (1.1658) lr 1.0000e-03 eta 21:52:53
epoch [31/50] batch [1520/2000] time 1.985 (2.046) data 0.000 (0.001) loss 0.6386 (1.1654) lr 1.0000e-03 eta 21:52:14
epoch [31/50] batch [1540/2000] time 2.028 (2.046) data 0.000 (0.001) loss 1.2856 (1.1666) lr 1.0000e-03 eta 21:51:32
epoch [31/50] batch [1560/2000] time 1.988 (2.046) data 0.000 (0.001) loss 2.2851 (1.1637) lr 1.0000e-03 eta 21:50:47
epoch [31/50] batch [1580/2000] time 2.074 (2.046) data 0.000 (0.001) loss 0.4546 (1.1648) lr 1.0000e-03 eta 21:50:08
epoch [31/50] batch [1600/2000] time 1.988 (2.046) data 0.000 (0.001) loss 0.6664 (1.1659) lr 1.0000e-03 eta 21:49:28
epoch [31/50] batch [1620/2000] time 2.066 (2.046) data 0.000 (0.001) loss 0.8547 (1.1680) lr 1.0000e-03 eta 21:48:48
epoch [31/50] batch [1640/2000] time 1.990 (2.046) data 0.000 (0.001) loss 4.3264 (1.1717) lr 1.0000e-03 eta 21:48:07
epoch [31/50] batch [1660/2000] time 2.040 (2.046) data 0.000 (0.001) loss 1.0612 (1.1702) lr 1.0000e-03 eta 21:47:24
epoch [31/50] batch [1680/2000] time 2.044 (2.046) data 0.001 (0.001) loss 1.7351 (1.1709) lr 1.0000e-03 eta 21:46:40
epoch [31/50] batch [1700/2000] time 2.024 (2.046) data 0.001 (0.001) loss 0.8621 (1.1710) lr 1.0000e-03 eta 21:45:57
epoch [31/50] batch [1720/2000] time 2.020 (2.046) data 0.000 (0.001) loss 2.2069 (1.1725) lr 1.0000e-03 eta 21:45:18
epoch [31/50] batch [1740/2000] time 2.066 (2.046) data 0.000 (0.001) loss 1.7613 (1.1689) lr 1.0000e-03 eta 21:44:39
epoch [31/50] batch [1760/2000] time 2.081 (2.046) data 0.000 (0.001) loss 0.8172 (1.1665) lr 1.0000e-03 eta 21:43:56
epoch [31/50] batch [1780/2000] time 2.017 (2.046) data 0.000 (0.001) loss 1.6920 (1.1678) lr 1.0000e-03 eta 21:43:19
epoch [31/50] batch [1800/2000] time 1.988 (2.046) data 0.000 (0.001) loss 0.2709 (1.1654) lr 1.0000e-03 eta 21:42:37
epoch [31/50] batch [1820/2000] time 2.070 (2.046) data 0.000 (0.001) loss 2.1788 (1.1670) lr 1.0000e-03 eta 21:41:51
epoch [31/50] batch [1840/2000] time 2.007 (2.046) data 0.000 (0.001) loss 2.6121 (1.1629) lr 1.0000e-03 eta 21:41:09
epoch [31/50] batch [1860/2000] time 2.008 (2.046) data 0.000 (0.001) loss 1.7832 (1.1601) lr 1.0000e-03 eta 21:40:25
epoch [31/50] batch [1880/2000] time 2.035 (2.046) data 0.000 (0.001) loss 1.3167 (1.1621) lr 1.0000e-03 eta 21:39:41
epoch [31/50] batch [1900/2000] time 2.058 (2.046) data 0.000 (0.001) loss 1.6721 (1.1628) lr 1.0000e-03 eta 21:38:56
epoch [31/50] batch [1920/2000] time 2.063 (2.046) data 0.000 (0.001) loss 1.4606 (1.1634) lr 1.0000e-03 eta 21:38:15
epoch [31/50] batch [1940/2000] time 2.018 (2.046) data 0.000 (0.001) loss 1.5164 (1.1643) lr 1.0000e-03 eta 21:37:32
epoch [31/50] batch [1960/2000] time 2.062 (2.045) data 0.000 (0.001) loss 0.1393 (1.1631) lr 1.0000e-03 eta 21:36:48
epoch [31/50] batch [1980/2000] time 2.006 (2.045) data 0.000 (0.001) loss 0.1998 (1.1625) lr 1.0000e-03 eta 21:36:03
epoch [31/50] batch [2000/2000] time 1.986 (2.045) data 0.000 (0.001) loss 0.5460 (1.1613) lr 9.3721e-04 eta 21:35:19
epoch [32/50] batch [20/2000] time 2.011 (2.073) data 0.000 (0.028) loss 1.8860 (1.1502) lr 9.3721e-04 eta 21:52:03
epoch [32/50] batch [40/2000] time 2.038 (2.057) data 0.000 (0.014) loss 0.7116 (1.1959) lr 9.3721e-04 eta 21:41:17
epoch [32/50] batch [60/2000] time 2.057 (2.051) data 0.001 (0.009) loss 0.4229 (1.2068) lr 9.3721e-04 eta 21:37:00
epoch [32/50] batch [80/2000] time 2.057 (2.048) data 0.000 (0.007) loss 1.5419 (1.2374) lr 9.3721e-04 eta 21:34:19
epoch [32/50] batch [100/2000] time 1.990 (2.047) data 0.000 (0.006) loss 2.1915 (1.2625) lr 9.3721e-04 eta 21:33:18
epoch [32/50] batch [120/2000] time 2.063 (2.047) data 0.000 (0.005) loss 0.7586 (1.2246) lr 9.3721e-04 eta 21:32:19
epoch [32/50] batch [140/2000] time 2.009 (2.047) data 0.000 (0.004) loss 0.2049 (1.2296) lr 9.3721e-04 eta 21:31:23
epoch [32/50] batch [160/2000] time 2.066 (2.047) data 0.000 (0.004) loss 0.6449 (1.2290) lr 9.3721e-04 eta 21:30:41
epoch [32/50] batch [180/2000] time 2.041 (2.046) data 0.000 (0.003) loss 1.1728 (1.2031) lr 9.3721e-04 eta 21:29:55
epoch [32/50] batch [200/2000] time 2.046 (2.046) data 0.000 (0.003) loss 2.1596 (1.2197) lr 9.3721e-04 eta 21:28:57
epoch [32/50] batch [220/2000] time 2.052 (2.046) data 0.000 (0.003) loss 1.9637 (1.2208) lr 9.3721e-04 eta 21:28:27
epoch [32/50] batch [240/2000] time 2.045 (2.046) data 0.000 (0.003) loss 0.2246 (1.2268) lr 9.3721e-04 eta 21:27:40
epoch [32/50] batch [260/2000] time 2.039 (2.046) data 0.000 (0.002) loss 1.9147 (1.2265) lr 9.3721e-04 eta 21:26:57
epoch [32/50] batch [280/2000] time 2.069 (2.046) data 0.000 (0.002) loss 1.8226 (1.2045) lr 9.3721e-04 eta 21:26:20
epoch [32/50] batch [300/2000] time 2.015 (2.046) data 0.000 (0.002) loss 2.0720 (1.2118) lr 9.3721e-04 eta 21:25:26
epoch [32/50] batch [320/2000] time 2.007 (2.045) data 0.000 (0.002) loss 0.6532 (1.2043) lr 9.3721e-04 eta 21:24:30
epoch [32/50] batch [340/2000] time 2.036 (2.045) data 0.000 (0.002) loss 0.8961 (1.2005) lr 9.3721e-04 eta 21:23:20
epoch [32/50] batch [360/2000] time 2.066 (2.045) data 0.000 (0.002) loss 2.2316 (1.2119) lr 9.3721e-04 eta 21:22:35
epoch [32/50] batch [380/2000] time 2.059 (2.044) data 0.000 (0.002) loss 1.2944 (1.2156) lr 9.3721e-04 eta 21:21:46
epoch [32/50] batch [400/2000] time 2.011 (2.044) data 0.000 (0.002) loss 1.1882 (1.2131) lr 9.3721e-04 eta 21:20:39
epoch [32/50] batch [420/2000] time 2.061 (2.044) data 0.000 (0.002) loss 1.5509 (1.2091) lr 9.3721e-04 eta 21:19:56
epoch [32/50] batch [440/2000] time 2.019 (2.044) data 0.001 (0.002) loss 1.1511 (1.2007) lr 9.3721e-04 eta 21:19:18
epoch [32/50] batch [460/2000] time 2.052 (2.044) data 0.000 (0.002) loss 0.2575 (1.1922) lr 9.3721e-04 eta 21:19:05
epoch [32/50] batch [480/2000] time 2.041 (2.045) data 0.000 (0.002) loss 0.8968 (1.1824) lr 9.3721e-04 eta 21:18:38
epoch [32/50] batch [500/2000] time 2.068 (2.045) data 0.000 (0.001) loss 2.0905 (1.1820) lr 9.3721e-04 eta 21:18:00
epoch [32/50] batch [520/2000] time 2.014 (2.044) data 0.000 (0.001) loss 0.2695 (1.1879) lr 9.3721e-04 eta 21:17:02
epoch [32/50] batch [540/2000] time 2.061 (2.044) data 0.000 (0.001) loss 0.5961 (1.1857) lr 9.3721e-04 eta 21:16:10
epoch [32/50] batch [560/2000] time 2.060 (2.044) data 0.000 (0.001) loss 0.7449 (1.1871) lr 9.3721e-04 eta 21:15:21
epoch [32/50] batch [580/2000] time 2.043 (2.044) data 0.000 (0.001) loss 3.0459 (1.1820) lr 9.3721e-04 eta 21:14:33
epoch [32/50] batch [600/2000] time 2.064 (2.044) data 0.001 (0.001) loss 1.1391 (1.1857) lr 9.3721e-04 eta 21:13:54
epoch [32/50] batch [620/2000] time 2.011 (2.044) data 0.000 (0.001) loss 1.8588 (1.1841) lr 9.3721e-04 eta 21:13:17
epoch [32/50] batch [640/2000] time 2.039 (2.044) data 0.000 (0.001) loss 0.1553 (1.1848) lr 9.3721e-04 eta 21:12:30
epoch [32/50] batch [660/2000] time 2.038 (2.044) data 0.000 (0.001) loss 1.5240 (1.1905) lr 9.3721e-04 eta 21:11:53
epoch [32/50] batch [680/2000] time 2.065 (2.044) data 0.000 (0.001) loss 0.1026 (1.1893) lr 9.3721e-04 eta 21:11:10
epoch [32/50] batch [700/2000] time 2.037 (2.044) data 0.000 (0.001) loss 1.4146 (1.1886) lr 9.3721e-04 eta 21:10:23
epoch [32/50] batch [720/2000] time 2.009 (2.043) data 0.000 (0.001) loss 0.2151 (1.1819) lr 9.3721e-04 eta 21:09:33
epoch [32/50] batch [740/2000] time 2.076 (2.043) data 0.000 (0.001) loss 0.5939 (1.1806) lr 9.3721e-04 eta 21:08:58
epoch [32/50] batch [760/2000] time 2.009 (2.043) data 0.000 (0.001) loss 0.8726 (1.1816) lr 9.3721e-04 eta 21:08:17
epoch [32/50] batch [780/2000] time 2.062 (2.043) data 0.000 (0.001) loss 0.0117 (1.1698) lr 9.3721e-04 eta 21:07:35
epoch [32/50] batch [800/2000] time 2.094 (2.051) data 0.000 (0.001) loss 1.2626 (1.1714) lr 9.3721e-04 eta 21:11:53
epoch [32/50] batch [820/2000] time 2.137 (2.054) data 0.001 (0.001) loss 0.3380 (1.1742) lr 9.3721e-04 eta 21:12:35
epoch [32/50] batch [840/2000] time 2.186 (2.061) data 0.000 (0.001) loss 0.7340 (1.1709) lr 9.3721e-04 eta 21:16:40
epoch [32/50] batch [860/2000] time 2.143 (2.063) data 0.000 (0.001) loss 1.3457 (1.1712) lr 9.3721e-04 eta 21:17:13
epoch [32/50] batch [880/2000] time 2.136 (2.070) data 0.000 (0.001) loss 0.5753 (1.1698) lr 9.3721e-04 eta 21:20:45
epoch [32/50] batch [900/2000] time 2.059 (2.071) data 0.000 (0.001) loss 0.6651 (1.1710) lr 9.3721e-04 eta 21:20:40
epoch [32/50] batch [920/2000] time 2.066 (2.071) data 0.000 (0.001) loss 1.0393 (1.1725) lr 9.3721e-04 eta 21:19:37
epoch [32/50] batch [940/2000] time 2.010 (2.070) data 0.000 (0.001) loss 2.0987 (1.1743) lr 9.3721e-04 eta 21:18:38
epoch [32/50] batch [960/2000] time 2.066 (2.069) data 0.000 (0.001) loss 1.3579 (1.1712) lr 9.3721e-04 eta 21:17:31
epoch [32/50] batch [980/2000] time 2.061 (2.069) data 0.000 (0.001) loss 0.5567 (1.1766) lr 9.3721e-04 eta 21:16:29
epoch [32/50] batch [1000/2000] time 2.061 (2.068) data 0.000 (0.001) loss 0.5582 (1.1831) lr 9.3721e-04 eta 21:15:23
epoch [32/50] batch [1020/2000] time 2.009 (2.068) data 0.000 (0.001) loss 3.3968 (1.1850) lr 9.3721e-04 eta 21:14:23
epoch [32/50] batch [1040/2000] time 2.059 (2.067) data 0.000 (0.001) loss 0.1931 (1.1818) lr 9.3721e-04 eta 21:13:27
epoch [32/50] batch [1060/2000] time 2.035 (2.067) data 0.000 (0.001) loss 1.3709 (1.1812) lr 9.3721e-04 eta 21:12:25
epoch [32/50] batch [1080/2000] time 2.037 (2.066) data 0.000 (0.001) loss 0.4244 (1.1788) lr 9.3721e-04 eta 21:11:29
epoch [32/50] batch [1100/2000] time 2.061 (2.066) data 0.000 (0.001) loss 0.7545 (1.1786) lr 9.3721e-04 eta 21:10:32
epoch [32/50] batch [1120/2000] time 2.038 (2.066) data 0.000 (0.001) loss 0.5432 (1.1800) lr 9.3721e-04 eta 21:09:39
epoch [32/50] batch [1140/2000] time 2.065 (2.065) data 0.001 (0.001) loss 1.9280 (1.1816) lr 9.3721e-04 eta 21:08:46
epoch [32/50] batch [1160/2000] time 2.044 (2.065) data 0.000 (0.001) loss 1.4260 (1.1789) lr 9.3721e-04 eta 21:07:48
epoch [32/50] batch [1180/2000] time 2.058 (2.064) data 0.000 (0.001) loss 0.0840 (1.1731) lr 9.3721e-04 eta 21:06:46
epoch [32/50] batch [1200/2000] time 2.035 (2.064) data 0.000 (0.001) loss 1.8456 (1.1688) lr 9.3721e-04 eta 21:05:50
epoch [32/50] batch [1220/2000] time 2.059 (2.063) data 0.000 (0.001) loss 0.7630 (1.1696) lr 9.3721e-04 eta 21:04:50
epoch [32/50] batch [1240/2000] time 2.040 (2.063) data 0.000 (0.001) loss 0.9556 (1.1702) lr 9.3721e-04 eta 21:03:47
epoch [32/50] batch [1260/2000] time 2.059 (2.062) data 0.000 (0.001) loss 0.7216 (1.1688) lr 9.3721e-04 eta 21:02:55
epoch [32/50] batch [1280/2000] time 2.032 (2.062) data 0.000 (0.001) loss 0.2389 (1.1670) lr 9.3721e-04 eta 21:01:56
epoch [32/50] batch [1300/2000] time 2.004 (2.062) data 0.000 (0.001) loss 0.8181 (1.1614) lr 9.3721e-04 eta 21:01:03
epoch [32/50] batch [1320/2000] time 2.040 (2.061) data 0.000 (0.001) loss 0.7814 (1.1641) lr 9.3721e-04 eta 21:00:10
epoch [32/50] batch [1340/2000] time 2.071 (2.061) data 0.000 (0.001) loss 1.0236 (1.1629) lr 9.3721e-04 eta 20:59:19
epoch [32/50] batch [1360/2000] time 2.060 (2.061) data 0.000 (0.001) loss 0.0347 (1.1606) lr 9.3721e-04 eta 20:58:29
epoch [32/50] batch [1380/2000] time 2.061 (2.061) data 0.000 (0.001) loss 1.2782 (1.1602) lr 9.3721e-04 eta 20:57:36
epoch [32/50] batch [1400/2000] time 2.007 (2.060) data 0.000 (0.001) loss 2.4935 (1.1648) lr 9.3721e-04 eta 20:56:42
epoch [32/50] batch [1420/2000] time 2.061 (2.060) data 0.000 (0.001) loss 2.1124 (1.1724) lr 9.3721e-04 eta 20:55:54
epoch [32/50] batch [1440/2000] time 2.010 (2.060) data 0.000 (0.001) loss 3.6892 (1.1711) lr 9.3721e-04 eta 20:55:01
epoch [32/50] batch [1460/2000] time 2.065 (2.060) data 0.000 (0.001) loss 0.4929 (1.1789) lr 9.3721e-04 eta 20:54:16
epoch [32/50] batch [1480/2000] time 2.072 (2.059) data 0.000 (0.001) loss 1.4422 (1.1763) lr 9.3721e-04 eta 20:53:27
epoch [32/50] batch [1500/2000] time 2.009 (2.059) data 0.000 (0.001) loss 0.2274 (1.1754) lr 9.3721e-04 eta 20:52:40
epoch [32/50] batch [1520/2000] time 2.073 (2.059) data 0.000 (0.001) loss 0.7337 (1.1749) lr 9.3721e-04 eta 20:51:51
epoch [32/50] batch [1540/2000] time 2.059 (2.059) data 0.000 (0.001) loss 0.4602 (1.1722) lr 9.3721e-04 eta 20:51:03
epoch [32/50] batch [1560/2000] time 2.018 (2.059) data 0.000 (0.001) loss 1.1583 (1.1722) lr 9.3721e-04 eta 20:50:16
epoch [32/50] batch [1580/2000] time 2.072 (2.058) data 0.000 (0.001) loss 1.2283 (1.1701) lr 9.3721e-04 eta 20:49:28
epoch [32/50] batch [1600/2000] time 2.010 (2.058) data 0.000 (0.001) loss 3.5446 (1.1674) lr 9.3721e-04 eta 20:48:40
epoch [32/50] batch [1620/2000] time 2.036 (2.058) data 0.000 (0.001) loss 0.8079 (1.1671) lr 9.3721e-04 eta 20:47:52
epoch [32/50] batch [1640/2000] time 2.063 (2.058) data 0.000 (0.001) loss 1.4835 (1.1729) lr 9.3721e-04 eta 20:47:04
epoch [32/50] batch [1660/2000] time 2.056 (2.058) data 0.000 (0.001) loss 0.9725 (1.1726) lr 9.3721e-04 eta 20:46:17
epoch [32/50] batch [1680/2000] time 2.061 (2.057) data 0.001 (0.001) loss 0.9471 (1.1757) lr 9.3721e-04 eta 20:45:27
epoch [32/50] batch [1700/2000] time 2.060 (2.057) data 0.000 (0.001) loss 0.8024 (1.1738) lr 9.3721e-04 eta 20:44:38
epoch [32/50] batch [1720/2000] time 2.064 (2.057) data 0.000 (0.001) loss 0.3947 (1.1727) lr 9.3721e-04 eta 20:43:49
epoch [32/50] batch [1740/2000] time 2.037 (2.057) data 0.000 (0.001) loss 0.0704 (1.1774) lr 9.3721e-04 eta 20:43:02
epoch [32/50] batch [1760/2000] time 2.009 (2.057) data 0.000 (0.001) loss 2.4080 (1.1799) lr 9.3721e-04 eta 20:42:14
epoch [32/50] batch [1780/2000] time 2.039 (2.057) data 0.000 (0.001) loss 0.7216 (1.1778) lr 9.3721e-04 eta 20:41:26
epoch [32/50] batch [1800/2000] time 2.021 (2.056) data 0.000 (0.001) loss 0.8592 (1.1728) lr 9.3721e-04 eta 20:40:41
epoch [32/50] batch [1820/2000] time 2.008 (2.056) data 0.000 (0.001) loss 0.6611 (1.1682) lr 9.3721e-04 eta 20:39:52
epoch [32/50] batch [1840/2000] time 2.065 (2.056) data 0.000 (0.001) loss 1.1590 (1.1646) lr 9.3721e-04 eta 20:39:07
epoch [32/50] batch [1860/2000] time 2.007 (2.056) data 0.000 (0.001) loss 1.1315 (1.1654) lr 9.3721e-04 eta 20:38:17
epoch [32/50] batch [1880/2000] time 2.067 (2.056) data 0.000 (0.001) loss 0.2744 (1.1639) lr 9.3721e-04 eta 20:37:33
epoch [32/50] batch [1900/2000] time 2.042 (2.056) data 0.000 (0.001) loss 3.3513 (1.1667) lr 9.3721e-04 eta 20:36:47
epoch [32/50] batch [1920/2000] time 2.007 (2.056) data 0.000 (0.001) loss 0.7712 (1.1679) lr 9.3721e-04 eta 20:36:19
epoch [32/50] batch [1940/2000] time 2.063 (2.056) data 0.000 (0.001) loss 3.2524 (1.1673) lr 9.3721e-04 eta 20:35:51
epoch [32/50] batch [1960/2000] time 1.995 (2.057) data 0.000 (0.001) loss 0.0346 (1.1659) lr 9.3721e-04 eta 20:35:25
epoch [32/50] batch [1980/2000] time 2.093 (2.057) data 0.000 (0.001) loss 1.3594 (1.1676) lr 9.3721e-04 eta 20:34:56
epoch [32/50] batch [2000/2000] time 2.166 (2.057) data 0.000 (0.001) loss 0.3136 (1.1705) lr 8.7467e-04 eta 20:34:24
epoch [33/50] batch [20/2000] time 2.063 (2.084) data 0.000 (0.028) loss 0.8722 (1.3188) lr 8.7467e-04 eta 20:49:35
epoch [33/50] batch [40/2000] time 2.062 (2.063) data 0.000 (0.014) loss 0.1492 (1.1181) lr 8.7467e-04 eta 20:36:28
epoch [33/50] batch [60/2000] time 2.042 (2.058) data 0.001 (0.009) loss 1.5103 (1.1609) lr 8.7467e-04 eta 20:32:40
epoch [33/50] batch [80/2000] time 2.044 (2.056) data 0.000 (0.007) loss 1.3866 (1.1259) lr 8.7467e-04 eta 20:30:33
epoch [33/50] batch [100/2000] time 2.011 (2.053) data 0.000 (0.006) loss 2.5722 (1.1760) lr 8.7467e-04 eta 20:28:36
epoch [33/50] batch [120/2000] time 2.015 (2.053) data 0.000 (0.005) loss 0.6267 (1.1701) lr 8.7467e-04 eta 20:27:52
epoch [33/50] batch [140/2000] time 2.143 (2.053) data 0.000 (0.004) loss 1.9007 (1.1448) lr 8.7467e-04 eta 20:27:08
epoch [33/50] batch [160/2000] time 2.043 (2.057) data 0.000 (0.004) loss 1.1112 (1.1356) lr 8.7467e-04 eta 20:28:47
epoch [33/50] batch [180/2000] time 2.064 (2.061) data 0.000 (0.003) loss 0.8128 (1.1345) lr 8.7467e-04 eta 20:30:33
epoch [33/50] batch [200/2000] time 2.042 (2.065) data 0.000 (0.003) loss 0.4139 (1.0988) lr 8.7467e-04 eta 20:31:51
epoch [33/50] batch [220/2000] time 2.011 (2.063) data 0.000 (0.003) loss 2.6475 (1.0890) lr 8.7467e-04 eta 20:30:00
epoch [33/50] batch [240/2000] time 2.131 (2.066) data 0.000 (0.003) loss 0.1079 (1.1055) lr 8.7467e-04 eta 20:31:05
epoch [33/50] batch [260/2000] time 2.022 (2.065) data 0.000 (0.002) loss 0.3989 (1.1425) lr 8.7467e-04 eta 20:29:45
epoch [33/50] batch [280/2000] time 2.067 (2.066) data 0.000 (0.002) loss 1.7252 (1.1430) lr 8.7467e-04 eta 20:29:47
epoch [33/50] batch [300/2000] time 2.015 (2.064) data 0.000 (0.002) loss 2.9221 (1.1694) lr 8.7467e-04 eta 20:28:20
epoch [33/50] batch [320/2000] time 2.153 (2.064) data 0.000 (0.002) loss 1.6557 (1.1704) lr 8.7467e-04 eta 20:27:16
epoch [33/50] batch [340/2000] time 1.984 (2.064) data 0.000 (0.002) loss 1.0445 (1.1920) lr 8.7467e-04 eta 20:26:58
epoch [33/50] batch [360/2000] time 2.058 (2.066) data 0.000 (0.002) loss 0.5905 (1.1902) lr 8.7467e-04 eta 20:26:58
epoch [33/50] batch [380/2000] time 2.009 (2.066) data 0.000 (0.002) loss 0.6745 (1.2103) lr 8.7467e-04 eta 20:26:46
epoch [33/50] batch [400/2000] time 2.013 (2.068) data 0.000 (0.002) loss 1.6182 (1.1940) lr 8.7467e-04 eta 20:26:55
epoch [33/50] batch [420/2000] time 2.048 (2.069) data 0.000 (0.002) loss 0.7863 (1.1948) lr 8.7467e-04 eta 20:27:09
epoch [33/50] batch [440/2000] time 2.014 (2.070) data 0.000 (0.002) loss 2.3548 (1.1895) lr 8.7467e-04 eta 20:26:55
epoch [33/50] batch [460/2000] time 1.991 (2.069) data 0.000 (0.001) loss 1.3694 (1.1765) lr 8.7467e-04 eta 20:25:36
epoch [33/50] batch [480/2000] time 2.070 (2.068) data 0.000 (0.001) loss 0.1112 (1.1894) lr 8.7467e-04 eta 20:24:19
epoch [33/50] batch [500/2000] time 2.042 (2.067) data 0.000 (0.001) loss 0.5232 (1.1783) lr 8.7467e-04 eta 20:23:11
epoch [33/50] batch [520/2000] time 2.063 (2.067) data 0.000 (0.001) loss 0.2374 (1.1818) lr 8.7467e-04 eta 20:22:07
epoch [33/50] batch [540/2000] time 2.008 (2.066) data 0.000 (0.001) loss 1.4134 (1.1854) lr 8.7467e-04 eta 20:20:53
epoch [33/50] batch [560/2000] time 2.063 (2.065) data 0.000 (0.001) loss 1.6245 (1.1870) lr 8.7467e-04 eta 20:19:38
epoch [33/50] batch [580/2000] time 2.210 (2.065) data 0.000 (0.001) loss 3.0470 (1.1892) lr 8.7467e-04 eta 20:19:02
epoch [33/50] batch [600/2000] time 2.020 (2.065) data 0.001 (0.001) loss 1.7183 (1.1868) lr 8.7467e-04 eta 20:18:28
epoch [33/50] batch [620/2000] time 2.068 (2.066) data 0.000 (0.001) loss 0.5784 (1.1805) lr 8.7467e-04 eta 20:18:14
epoch [33/50] batch [640/2000] time 2.060 (2.067) data 0.000 (0.001) loss 0.3192 (1.1747) lr 8.7467e-04 eta 20:18:02
epoch [33/50] batch [660/2000] time 2.040 (2.066) data 0.000 (0.001) loss 2.2478 (1.1804) lr 8.7467e-04 eta 20:16:55
epoch [33/50] batch [680/2000] time 2.060 (2.067) data 0.000 (0.001) loss 0.4727 (1.1837) lr 8.7467e-04 eta 20:16:34
epoch [33/50] batch [700/2000] time 2.341 (2.067) data 0.000 (0.001) loss 2.6604 (1.1929) lr 8.7467e-04 eta 20:15:51
epoch [33/50] batch [720/2000] time 2.025 (2.067) data 0.000 (0.001) loss 1.2183 (1.1811) lr 8.7467e-04 eta 20:15:27
epoch [33/50] batch [740/2000] time 2.062 (2.067) data 0.000 (0.001) loss 0.1256 (1.1816) lr 8.7467e-04 eta 20:14:33
epoch [33/50] batch [760/2000] time 2.073 (2.067) data 0.000 (0.001) loss 1.4600 (1.1837) lr 8.7467e-04 eta 20:14:17
epoch [33/50] batch [780/2000] time 2.041 (2.068) data 0.000 (0.001) loss 0.9681 (1.1832) lr 8.7467e-04 eta 20:14:02
epoch [33/50] batch [800/2000] time 2.115 (2.068) data 0.000 (0.001) loss 1.8579 (1.1776) lr 8.7467e-04 eta 20:13:26
epoch [33/50] batch [820/2000] time 2.116 (2.069) data 0.000 (0.001) loss 0.1458 (1.1779) lr 8.7467e-04 eta 20:13:06
epoch [33/50] batch [840/2000] time 2.165 (2.070) data 0.000 (0.001) loss 2.8123 (1.1775) lr 8.7467e-04 eta 20:12:45
epoch [33/50] batch [860/2000] time 2.035 (2.070) data 0.000 (0.001) loss 0.9519 (1.1749) lr 8.7467e-04 eta 20:12:12
epoch [33/50] batch [880/2000] time 2.044 (2.070) data 0.000 (0.001) loss 0.5447 (1.1774) lr 8.7467e-04 eta 20:11:36
epoch [33/50] batch [900/2000] time 2.042 (2.070) data 0.000 (0.001) loss 2.2077 (1.1707) lr 8.7467e-04 eta 20:10:39
epoch [33/50] batch [920/2000] time 2.098 (2.069) data 0.000 (0.001) loss 0.9983 (1.1700) lr 8.7467e-04 eta 20:09:48
epoch [33/50] batch [940/2000] time 2.018 (2.069) data 0.000 (0.001) loss 0.0426 (1.1704) lr 8.7467e-04 eta 20:08:54
epoch [33/50] batch [960/2000] time 1.991 (2.068) data 0.000 (0.001) loss 0.6367 (1.1687) lr 8.7467e-04 eta 20:07:55
epoch [33/50] batch [980/2000] time 2.065 (2.068) data 0.001 (0.001) loss 0.5853 (1.1723) lr 8.7467e-04 eta 20:06:54
epoch [33/50] batch [1000/2000] time 2.081 (2.068) data 0.000 (0.001) loss 0.0293 (1.1651) lr 8.7467e-04 eta 20:06:06
epoch [33/50] batch [1020/2000] time 2.026 (2.068) data 0.000 (0.001) loss 0.0520 (1.1671) lr 8.7467e-04 eta 20:05:39
epoch [33/50] batch [1040/2000] time 2.042 (2.069) data 0.000 (0.001) loss 0.9067 (1.1699) lr 8.7467e-04 eta 20:05:27
epoch [33/50] batch [1060/2000] time 2.077 (2.070) data 0.000 (0.001) loss 1.3035 (1.1699) lr 8.7467e-04 eta 20:05:14
epoch [33/50] batch [1080/2000] time 2.082 (2.069) data 0.000 (0.001) loss 1.1120 (1.1645) lr 8.7467e-04 eta 20:04:17
epoch [33/50] batch [1100/2000] time 2.181 (2.069) data 0.000 (0.001) loss 0.1614 (1.1666) lr 8.7467e-04 eta 20:03:31
epoch [33/50] batch [1120/2000] time 2.023 (2.069) data 0.000 (0.001) loss 0.1459 (1.1694) lr 8.7467e-04 eta 20:02:59
epoch [33/50] batch [1140/2000] time 2.112 (2.070) data 0.001 (0.001) loss 1.3751 (1.1656) lr 8.7467e-04 eta 20:02:37
epoch [33/50] batch [1160/2000] time 2.076 (2.070) data 0.000 (0.001) loss 1.2738 (1.1704) lr 8.7467e-04 eta 20:01:54
epoch [33/50] batch [1180/2000] time 2.129 (2.070) data 0.001 (0.001) loss 1.0363 (1.1699) lr 8.7467e-04 eta 20:01:17
epoch [33/50] batch [1200/2000] time 2.063 (2.070) data 0.000 (0.001) loss 0.2489 (1.1690) lr 8.7467e-04 eta 20:00:28
epoch [33/50] batch [1220/2000] time 2.058 (2.069) data 0.000 (0.001) loss 0.2754 (1.1706) lr 8.7467e-04 eta 19:59:35
epoch [33/50] batch [1240/2000] time 2.036 (2.069) data 0.000 (0.001) loss 0.2021 (1.1694) lr 8.7467e-04 eta 19:58:37
epoch [33/50] batch [1260/2000] time 2.060 (2.069) data 0.000 (0.001) loss 0.4870 (1.1679) lr 8.7467e-04 eta 19:57:40
epoch [33/50] batch [1280/2000] time 2.063 (2.068) data 0.000 (0.001) loss 0.5149 (1.1656) lr 8.7467e-04 eta 19:56:46
epoch [33/50] batch [1300/2000] time 2.062 (2.068) data 0.000 (0.001) loss 0.2716 (1.1721) lr 8.7467e-04 eta 19:55:49
epoch [33/50] batch [1320/2000] time 2.015 (2.067) data 0.000 (0.001) loss 0.4016 (1.1691) lr 8.7467e-04 eta 19:54:55
epoch [33/50] batch [1340/2000] time 2.061 (2.067) data 0.000 (0.001) loss 0.9174 (1.1724) lr 8.7467e-04 eta 19:54:05
epoch [33/50] batch [1360/2000] time 2.007 (2.067) data 0.000 (0.001) loss 5.4085 (1.1766) lr 8.7467e-04 eta 19:53:13
epoch [33/50] batch [1380/2000] time 2.073 (2.066) data 0.000 (0.001) loss 0.2233 (1.1804) lr 8.7467e-04 eta 19:52:22
epoch [33/50] batch [1400/2000] time 1.986 (2.066) data 0.000 (0.001) loss 1.3219 (1.1768) lr 8.7467e-04 eta 19:51:30
epoch [33/50] batch [1420/2000] time 2.063 (2.066) data 0.000 (0.001) loss 2.7927 (1.1821) lr 8.7467e-04 eta 19:50:34
epoch [33/50] batch [1440/2000] time 2.036 (2.065) data 0.000 (0.001) loss 1.2377 (1.1839) lr 8.7467e-04 eta 19:49:38
epoch [33/50] batch [1460/2000] time 2.068 (2.065) data 0.000 (0.001) loss 1.6848 (1.1791) lr 8.7467e-04 eta 19:48:46
epoch [33/50] batch [1480/2000] time 2.019 (2.065) data 0.000 (0.001) loss 1.6077 (1.1799) lr 8.7467e-04 eta 19:47:55
epoch [33/50] batch [1500/2000] time 2.011 (2.064) data 0.000 (0.001) loss 1.0343 (1.1769) lr 8.7467e-04 eta 19:47:02
epoch [33/50] batch [1520/2000] time 2.009 (2.064) data 0.000 (0.001) loss 1.2876 (1.1802) lr 8.7467e-04 eta 19:46:10
epoch [33/50] batch [1540/2000] time 2.010 (2.064) data 0.000 (0.001) loss 0.1736 (1.1756) lr 8.7467e-04 eta 19:45:16
epoch [33/50] batch [1560/2000] time 2.038 (2.064) data 0.000 (0.001) loss 1.3569 (1.1754) lr 8.7467e-04 eta 19:44:28
epoch [33/50] batch [1580/2000] time 2.074 (2.063) data 0.000 (0.001) loss 2.4075 (1.1785) lr 8.7467e-04 eta 19:43:39
epoch [33/50] batch [1600/2000] time 2.019 (2.063) data 0.000 (0.001) loss 1.5606 (1.1768) lr 8.7467e-04 eta 19:42:49
epoch [33/50] batch [1620/2000] time 2.063 (2.063) data 0.000 (0.001) loss 2.0550 (1.1736) lr 8.7467e-04 eta 19:41:58
epoch [33/50] batch [1640/2000] time 2.072 (2.062) data 0.000 (0.001) loss 2.7969 (1.1700) lr 8.7467e-04 eta 19:41:06
epoch [33/50] batch [1660/2000] time 2.040 (2.062) data 0.000 (0.001) loss 0.3302 (1.1702) lr 8.7467e-04 eta 19:40:13
epoch [33/50] batch [1680/2000] time 2.061 (2.062) data 0.001 (0.001) loss 1.4154 (1.1673) lr 8.7467e-04 eta 19:39:25
epoch [33/50] batch [1700/2000] time 2.016 (2.062) data 0.000 (0.001) loss 1.0278 (1.1669) lr 8.7467e-04 eta 19:38:34
epoch [33/50] batch [1720/2000] time 2.070 (2.061) data 0.000 (0.001) loss 0.7629 (1.1625) lr 8.7467e-04 eta 19:37:46
epoch [33/50] batch [1740/2000] time 2.057 (2.061) data 0.000 (0.001) loss 1.1964 (1.1638) lr 8.7467e-04 eta 19:37:01
epoch [33/50] batch [1760/2000] time 1.993 (2.061) data 0.000 (0.001) loss 3.0565 (1.1644) lr 8.7467e-04 eta 19:36:12
epoch [33/50] batch [1780/2000] time 2.007 (2.061) data 0.000 (0.001) loss 0.6084 (1.1617) lr 8.7467e-04 eta 19:35:24
epoch [33/50] batch [1800/2000] time 2.062 (2.061) data 0.000 (0.001) loss 2.4672 (1.1620) lr 8.7467e-04 eta 19:34:35
epoch [33/50] batch [1820/2000] time 2.042 (2.061) data 0.000 (0.001) loss 3.4984 (1.1649) lr 8.7467e-04 eta 19:33:47
epoch [33/50] batch [1840/2000] time 2.065 (2.060) data 0.000 (0.001) loss 0.0602 (1.1618) lr 8.7467e-04 eta 19:33:00
epoch [33/50] batch [1860/2000] time 2.043 (2.060) data 0.000 (0.001) loss 5.0533 (1.1634) lr 8.7467e-04 eta 19:32:14
epoch [33/50] batch [1880/2000] time 2.008 (2.060) data 0.000 (0.001) loss 1.3618 (1.1629) lr 8.7467e-04 eta 19:31:26
epoch [33/50] batch [1900/2000] time 2.013 (2.060) data 0.000 (0.001) loss 4.4833 (1.1642) lr 8.7467e-04 eta 19:30:41
epoch [33/50] batch [1920/2000] time 2.081 (2.060) data 0.000 (0.001) loss 0.8182 (1.1646) lr 8.7467e-04 eta 19:29:54
epoch [33/50] batch [1940/2000] time 2.011 (2.060) data 0.000 (0.001) loss 1.5523 (1.1706) lr 8.7467e-04 eta 19:29:08
epoch [33/50] batch [1960/2000] time 2.063 (2.059) data 0.000 (0.001) loss 0.6529 (1.1705) lr 8.7467e-04 eta 19:28:21
epoch [33/50] batch [1980/2000] time 2.067 (2.059) data 0.000 (0.001) loss 1.8308 (1.1702) lr 8.7467e-04 eta 19:27:33
epoch [33/50] batch [2000/2000] time 2.063 (2.059) data 0.000 (0.001) loss 0.5883 (1.1672) lr 8.1262e-04 eta 19:26:48
epoch [34/50] batch [20/2000] time 2.048 (2.074) data 0.000 (0.029) loss 1.7834 (1.5717) lr 8.1262e-04 eta 19:34:23
epoch [34/50] batch [40/2000] time 2.071 (2.064) data 0.000 (0.015) loss 0.4906 (1.3732) lr 8.1262e-04 eta 19:28:01
epoch [34/50] batch [60/2000] time 1.989 (2.054) data 0.001 (0.010) loss 0.8292 (1.2617) lr 8.1262e-04 eta 19:21:57
epoch [34/50] batch [80/2000] time 2.064 (2.052) data 0.000 (0.007) loss 0.1725 (1.2622) lr 8.1262e-04 eta 19:19:57
epoch [34/50] batch [100/2000] time 2.010 (2.050) data 0.000 (0.006) loss 0.1672 (1.2002) lr 8.1262e-04 eta 19:18:01
epoch [34/50] batch [120/2000] time 2.018 (2.049) data 0.000 (0.005) loss 1.4229 (1.2458) lr 8.1262e-04 eta 19:17:02
epoch [34/50] batch [140/2000] time 1.988 (2.048) data 0.000 (0.004) loss 0.3345 (1.2780) lr 8.1262e-04 eta 19:15:36
epoch [34/50] batch [160/2000] time 2.048 (2.048) data 0.004 (0.004) loss 4.1729 (1.2202) lr 8.1262e-04 eta 19:14:52
epoch [34/50] batch [180/2000] time 2.082 (2.048) data 0.000 (0.003) loss 0.7344 (1.2158) lr 8.1262e-04 eta 19:14:24
epoch [34/50] batch [200/2000] time 2.042 (2.048) data 0.000 (0.003) loss 0.7428 (1.2340) lr 8.1262e-04 eta 19:13:34
epoch [34/50] batch [220/2000] time 2.009 (2.047) data 0.000 (0.003) loss 0.4402 (1.2032) lr 8.1262e-04 eta 19:12:38
epoch [34/50] batch [240/2000] time 2.068 (2.047) data 0.000 (0.003) loss 2.7023 (1.2076) lr 8.1262e-04 eta 19:11:48
epoch [34/50] batch [260/2000] time 2.010 (2.047) data 0.000 (0.003) loss 0.4284 (1.2010) lr 8.1262e-04 eta 19:10:55
epoch [34/50] batch [280/2000] time 2.016 (2.047) data 0.000 (0.002) loss 0.2699 (1.1944) lr 8.1262e-04 eta 19:10:26
epoch [34/50] batch [300/2000] time 2.070 (2.047) data 0.000 (0.002) loss 0.0342 (1.1955) lr 8.1262e-04 eta 19:09:39
epoch [34/50] batch [320/2000] time 2.076 (2.047) data 0.000 (0.002) loss 2.7344 (1.1838) lr 8.1262e-04 eta 19:09:07
epoch [34/50] batch [340/2000] time 1.988 (2.047) data 0.000 (0.002) loss 2.0271 (1.1769) lr 8.1262e-04 eta 19:08:12
epoch [34/50] batch [360/2000] time 2.075 (2.047) data 0.000 (0.002) loss 1.1985 (1.1540) lr 8.1262e-04 eta 19:07:39
epoch [34/50] batch [380/2000] time 2.070 (2.047) data 0.000 (0.002) loss 1.0879 (1.1508) lr 8.1262e-04 eta 19:07:05
epoch [34/50] batch [400/2000] time 2.071 (2.047) data 0.000 (0.002) loss 2.0062 (1.1571) lr 8.1262e-04 eta 19:06:30
epoch [34/50] batch [420/2000] time 2.015 (2.047) data 0.000 (0.002) loss 2.1360 (1.1461) lr 8.1262e-04 eta 19:05:52
epoch [34/50] batch [440/2000] time 2.069 (2.048) data 0.000 (0.002) loss 0.3337 (1.1360) lr 8.1262e-04 eta 19:05:32
epoch [34/50] batch [460/2000] time 2.018 (2.048) data 0.000 (0.002) loss 0.8269 (1.1646) lr 8.1262e-04 eta 19:05:03
epoch [34/50] batch [480/2000] time 2.071 (2.049) data 0.000 (0.002) loss 0.0436 (1.1560) lr 8.1262e-04 eta 19:04:31
epoch [34/50] batch [500/2000] time 1.985 (2.049) data 0.000 (0.001) loss 1.7100 (1.1417) lr 8.1262e-04 eta 19:03:48
epoch [34/50] batch [520/2000] time 2.022 (2.049) data 0.000 (0.001) loss 0.8524 (1.1505) lr 8.1262e-04 eta 19:03:05
epoch [34/50] batch [540/2000] time 2.066 (2.049) data 0.000 (0.001) loss 0.1703 (1.1376) lr 8.1262e-04 eta 19:02:29
epoch [34/50] batch [560/2000] time 2.068 (2.048) data 0.000 (0.001) loss 0.1504 (1.1376) lr 8.1262e-04 eta 19:01:35
epoch [34/50] batch [580/2000] time 2.008 (2.048) data 0.000 (0.001) loss 0.5954 (1.1305) lr 8.1262e-04 eta 19:00:45
epoch [34/50] batch [600/2000] time 2.042 (2.048) data 0.001 (0.001) loss 0.7610 (1.1304) lr 8.1262e-04 eta 18:59:56
epoch [34/50] batch [620/2000] time 2.066 (2.047) data 0.000 (0.001) loss 1.8301 (1.1287) lr 8.1262e-04 eta 18:59:04
epoch [34/50] batch [640/2000] time 2.044 (2.047) data 0.000 (0.001) loss 0.3267 (1.1309) lr 8.1262e-04 eta 18:58:16
epoch [34/50] batch [660/2000] time 2.025 (2.047) data 0.000 (0.001) loss 1.0378 (1.1364) lr 8.1262e-04 eta 18:57:34
epoch [34/50] batch [680/2000] time 2.064 (2.047) data 0.000 (0.001) loss 0.8446 (1.1312) lr 8.1262e-04 eta 18:56:54
epoch [34/50] batch [700/2000] time 2.046 (2.047) data 0.000 (0.001) loss 0.2819 (1.1241) lr 8.1262e-04 eta 18:56:07
epoch [34/50] batch [720/2000] time 2.046 (2.047) data 0.001 (0.001) loss 1.3561 (1.1375) lr 8.1262e-04 eta 18:55:20
epoch [34/50] batch [740/2000] time 2.052 (2.047) data 0.002 (0.001) loss 2.3029 (1.1389) lr 8.1262e-04 eta 18:54:36
epoch [34/50] batch [760/2000] time 2.063 (2.047) data 0.000 (0.001) loss 1.2658 (1.1336) lr 8.1262e-04 eta 18:54:01
epoch [34/50] batch [780/2000] time 2.067 (2.047) data 0.000 (0.001) loss 0.2167 (1.1295) lr 8.1262e-04 eta 18:53:18
epoch [34/50] batch [800/2000] time 2.000 (2.047) data 0.000 (0.001) loss 2.3533 (1.1323) lr 8.1262e-04 eta 18:52:33
epoch [34/50] batch [820/2000] time 2.013 (2.047) data 0.000 (0.001) loss 1.4862 (1.1346) lr 8.1262e-04 eta 18:51:49
epoch [34/50] batch [840/2000] time 2.071 (2.047) data 0.000 (0.001) loss 0.8174 (1.1341) lr 8.1262e-04 eta 18:51:05
epoch [34/50] batch [860/2000] time 2.075 (2.046) data 0.000 (0.001) loss 0.7787 (1.1393) lr 8.1262e-04 eta 18:50:20
epoch [34/50] batch [880/2000] time 2.065 (2.047) data 0.000 (0.001) loss 1.3486 (1.1355) lr 8.1262e-04 eta 18:49:41
epoch [34/50] batch [900/2000] time 2.069 (2.047) data 0.003 (0.001) loss 1.7115 (1.1351) lr 8.1262e-04 eta 18:49:01
epoch [34/50] batch [920/2000] time 2.067 (2.047) data 0.000 (0.001) loss 0.4420 (1.1335) lr 8.1262e-04 eta 18:48:23
epoch [34/50] batch [940/2000] time 2.046 (2.047) data 0.000 (0.001) loss 0.1558 (1.1343) lr 8.1262e-04 eta 18:47:38
epoch [34/50] batch [960/2000] time 2.071 (2.047) data 0.000 (0.001) loss 3.0011 (1.1404) lr 8.1262e-04 eta 18:46:58
epoch [34/50] batch [980/2000] time 2.066 (2.047) data 0.000 (0.001) loss 0.1430 (1.1419) lr 8.1262e-04 eta 18:46:20
epoch [34/50] batch [1000/2000] time 1.984 (2.047) data 0.000 (0.001) loss 0.1757 (1.1381) lr 8.1262e-04 eta 18:45:37
epoch [34/50] batch [1020/2000] time 1.999 (2.046) data 0.000 (0.001) loss 0.2282 (1.1385) lr 8.1262e-04 eta 18:44:51
epoch [34/50] batch [1040/2000] time 2.066 (2.046) data 0.000 (0.001) loss 1.3483 (1.1351) lr 8.1262e-04 eta 18:44:08
epoch [34/50] batch [1060/2000] time 2.071 (2.046) data 0.000 (0.001) loss 0.4466 (1.1336) lr 8.1262e-04 eta 18:43:28
epoch [34/50] batch [1080/2000] time 2.044 (2.046) data 0.000 (0.001) loss 0.4903 (1.1369) lr 8.1262e-04 eta 18:42:47
epoch [34/50] batch [1100/2000] time 2.048 (2.046) data 0.000 (0.001) loss 0.1106 (1.1304) lr 8.1262e-04 eta 18:42:09
epoch [34/50] batch [1120/2000] time 2.042 (2.046) data 0.000 (0.001) loss 0.6986 (1.1295) lr 8.1262e-04 eta 18:41:24
epoch [34/50] batch [1140/2000] time 2.014 (2.046) data 0.001 (0.001) loss 0.9584 (1.1292) lr 8.1262e-04 eta 18:40:42
epoch [34/50] batch [1160/2000] time 2.069 (2.046) data 0.000 (0.001) loss 1.2626 (1.1310) lr 8.1262e-04 eta 18:40:05
epoch [34/50] batch [1180/2000] time 2.070 (2.046) data 0.000 (0.001) loss 1.7494 (1.1292) lr 8.1262e-04 eta 18:39:23
epoch [34/50] batch [1200/2000] time 2.019 (2.046) data 0.000 (0.001) loss 1.3551 (1.1276) lr 8.1262e-04 eta 18:38:42
epoch [34/50] batch [1220/2000] time 2.065 (2.046) data 0.000 (0.001) loss 0.6754 (1.1230) lr 8.1262e-04 eta 18:38:00
epoch [34/50] batch [1240/2000] time 2.068 (2.046) data 0.000 (0.001) loss 0.7065 (1.1214) lr 8.1262e-04 eta 18:37:22
epoch [34/50] batch [1260/2000] time 2.045 (2.046) data 0.000 (0.001) loss 0.6435 (1.1235) lr 8.1262e-04 eta 18:36:38
epoch [34/50] batch [1280/2000] time 2.062 (2.046) data 0.000 (0.001) loss 0.0767 (1.1177) lr 8.1262e-04 eta 18:35:58
epoch [34/50] batch [1300/2000] time 2.010 (2.046) data 0.000 (0.001) loss 1.0412 (1.1133) lr 8.1262e-04 eta 18:35:12
epoch [34/50] batch [1320/2000] time 2.043 (2.046) data 0.000 (0.001) loss 0.4714 (1.1092) lr 8.1262e-04 eta 18:34:28
epoch [34/50] batch [1340/2000] time 2.074 (2.046) data 0.000 (0.001) loss 0.9935 (1.1133) lr 8.1262e-04 eta 18:33:49
epoch [34/50] batch [1360/2000] time 2.040 (2.046) data 0.000 (0.001) loss 0.3427 (1.1130) lr 8.1262e-04 eta 18:33:08
epoch [34/50] batch [1380/2000] time 2.068 (2.046) data 0.000 (0.001) loss 1.7819 (1.1201) lr 8.1262e-04 eta 18:32:25
epoch [34/50] batch [1400/2000] time 2.064 (2.046) data 0.000 (0.001) loss 1.5061 (1.1229) lr 8.1262e-04 eta 18:31:43
epoch [34/50] batch [1420/2000] time 2.067 (2.046) data 0.000 (0.001) loss 1.1011 (1.1228) lr 8.1262e-04 eta 18:31:04
epoch [34/50] batch [1440/2000] time 2.045 (2.046) data 0.000 (0.001) loss 1.6668 (1.1203) lr 8.1262e-04 eta 18:30:27
epoch [34/50] batch [1460/2000] time 2.050 (2.046) data 0.000 (0.001) loss 0.8354 (1.1201) lr 8.1262e-04 eta 18:29:52
epoch [34/50] batch [1480/2000] time 2.069 (2.046) data 0.000 (0.001) loss 1.8724 (1.1230) lr 8.1262e-04 eta 18:29:09
epoch [34/50] batch [1500/2000] time 2.051 (2.047) data 0.000 (0.001) loss 0.1350 (1.1239) lr 8.1262e-04 eta 18:28:34
epoch [34/50] batch [1520/2000] time 2.044 (2.047) data 0.000 (0.001) loss 0.8579 (1.1198) lr 8.1262e-04 eta 18:27:55
epoch [34/50] batch [1540/2000] time 2.065 (2.047) data 0.000 (0.001) loss 0.4314 (1.1206) lr 8.1262e-04 eta 18:27:19
epoch [34/50] batch [1560/2000] time 2.011 (2.047) data 0.000 (0.001) loss 0.0729 (1.1200) lr 8.1262e-04 eta 18:26:38
epoch [34/50] batch [1580/2000] time 2.070 (2.047) data 0.000 (0.001) loss 2.1977 (1.1195) lr 8.1262e-04 eta 18:25:57
epoch [34/50] batch [1600/2000] time 2.068 (2.047) data 0.000 (0.001) loss 0.4262 (1.1183) lr 8.1262e-04 eta 18:25:16
epoch [34/50] batch [1620/2000] time 2.096 (2.047) data 0.005 (0.001) loss 0.6327 (1.1183) lr 8.1262e-04 eta 18:24:39
epoch [34/50] batch [1640/2000] time 1.989 (2.047) data 0.000 (0.001) loss 0.0261 (1.1163) lr 8.1262e-04 eta 18:23:57
epoch [34/50] batch [1660/2000] time 2.061 (2.047) data 0.000 (0.001) loss 1.1271 (1.1177) lr 8.1262e-04 eta 18:23:15
epoch [34/50] batch [1680/2000] time 2.044 (2.047) data 0.001 (0.001) loss 0.1253 (1.1193) lr 8.1262e-04 eta 18:22:32
epoch [34/50] batch [1700/2000] time 2.070 (2.047) data 0.000 (0.001) loss 0.4750 (1.1257) lr 8.1262e-04 eta 18:21:52
epoch [34/50] batch [1720/2000] time 2.067 (2.047) data 0.000 (0.001) loss 1.3117 (1.1267) lr 8.1262e-04 eta 18:21:08
epoch [34/50] batch [1740/2000] time 2.046 (2.047) data 0.000 (0.001) loss 0.0097 (1.1246) lr 8.1262e-04 eta 18:20:25
epoch [34/50] batch [1760/2000] time 2.067 (2.047) data 0.001 (0.001) loss 0.6310 (1.1219) lr 8.1262e-04 eta 18:19:45
epoch [34/50] batch [1780/2000] time 2.072 (2.047) data 0.000 (0.001) loss 0.2473 (1.1246) lr 8.1262e-04 eta 18:19:06
epoch [34/50] batch [1800/2000] time 2.013 (2.047) data 0.000 (0.001) loss 0.2131 (1.1229) lr 8.1262e-04 eta 18:18:26
epoch [34/50] batch [1820/2000] time 2.014 (2.047) data 0.000 (0.001) loss 1.3391 (1.1256) lr 8.1262e-04 eta 18:17:46
epoch [34/50] batch [1840/2000] time 2.072 (2.047) data 0.001 (0.001) loss 0.7646 (1.1264) lr 8.1262e-04 eta 18:17:09
epoch [34/50] batch [1860/2000] time 2.074 (2.047) data 0.001 (0.001) loss 1.0520 (1.1298) lr 8.1262e-04 eta 18:16:30
epoch [34/50] batch [1880/2000] time 2.071 (2.047) data 0.000 (0.001) loss 2.8315 (1.1289) lr 8.1262e-04 eta 18:15:49
epoch [34/50] batch [1900/2000] time 2.068 (2.047) data 0.000 (0.001) loss 0.3838 (1.1315) lr 8.1262e-04 eta 18:15:08
epoch [34/50] batch [1920/2000] time 2.012 (2.047) data 0.000 (0.001) loss 0.8015 (1.1301) lr 8.1262e-04 eta 18:14:27
epoch [34/50] batch [1940/2000] time 2.065 (2.047) data 0.000 (0.001) loss 1.1216 (1.1308) lr 8.1262e-04 eta 18:13:47
epoch [34/50] batch [1960/2000] time 2.012 (2.047) data 0.000 (0.001) loss 0.7037 (1.1320) lr 8.1262e-04 eta 18:13:05
epoch [34/50] batch [1980/2000] time 2.064 (2.047) data 0.000 (0.001) loss 0.3423 (1.1339) lr 8.1262e-04 eta 18:12:21
epoch [34/50] batch [2000/2000] time 2.057 (2.047) data 0.000 (0.001) loss 0.7075 (1.1382) lr 7.5131e-04 eta 18:11:37
epoch [35/50] batch [20/2000] time 2.039 (2.067) data 0.000 (0.030) loss 3.0368 (1.3608) lr 7.5131e-04 eta 18:21:41
epoch [35/50] batch [40/2000] time 2.004 (2.052) data 0.000 (0.015) loss 2.1939 (1.2312) lr 7.5131e-04 eta 18:12:54
epoch [35/50] batch [60/2000] time 2.034 (2.046) data 0.001 (0.010) loss 0.7739 (1.1674) lr 7.5131e-04 eta 18:09:15
epoch [35/50] batch [80/2000] time 2.045 (2.044) data 0.000 (0.008) loss 0.9979 (1.2012) lr 7.5131e-04 eta 18:07:17
epoch [35/50] batch [100/2000] time 2.055 (2.044) data 0.000 (0.006) loss 0.8084 (1.2000) lr 7.5131e-04 eta 18:06:40
epoch [35/50] batch [120/2000] time 2.042 (2.042) data 0.005 (0.005) loss 0.4364 (1.1776) lr 7.5131e-04 eta 18:05:07
epoch [35/50] batch [140/2000] time 2.007 (2.041) data 0.000 (0.005) loss 0.1981 (1.2387) lr 7.5131e-04 eta 18:03:42
epoch [35/50] batch [160/2000] time 2.012 (2.040) data 0.000 (0.004) loss 1.5560 (1.2319) lr 7.5131e-04 eta 18:02:37
epoch [35/50] batch [180/2000] time 2.064 (2.039) data 0.000 (0.004) loss 0.8744 (1.2270) lr 7.5131e-04 eta 18:01:26
epoch [35/50] batch [200/2000] time 2.062 (2.039) data 0.000 (0.003) loss 0.0142 (1.1983) lr 7.5131e-04 eta 18:00:41
epoch [35/50] batch [220/2000] time 2.038 (2.038) data 0.000 (0.003) loss 0.1613 (1.1793) lr 7.5131e-04 eta 17:59:34
epoch [35/50] batch [240/2000] time 2.063 (2.039) data 0.000 (0.003) loss 3.2210 (1.2120) lr 7.5131e-04 eta 17:59:12
epoch [35/50] batch [260/2000] time 2.007 (2.038) data 0.000 (0.003) loss 0.8274 (1.2261) lr 7.5131e-04 eta 17:58:16
epoch [35/50] batch [280/2000] time 2.006 (2.038) data 0.000 (0.002) loss 2.3642 (1.2270) lr 7.5131e-04 eta 17:57:36
epoch [35/50] batch [300/2000] time 2.034 (2.038) data 0.000 (0.002) loss 1.5002 (1.2343) lr 7.5131e-04 eta 17:56:52
epoch [35/50] batch [320/2000] time 2.059 (2.038) data 0.000 (0.002) loss 2.2411 (1.2143) lr 7.5131e-04 eta 17:56:13
epoch [35/50] batch [340/2000] time 2.007 (2.038) data 0.000 (0.002) loss 1.0235 (1.2166) lr 7.5131e-04 eta 17:55:26
epoch [35/50] batch [360/2000] time 2.058 (2.038) data 0.000 (0.002) loss 0.6659 (1.2100) lr 7.5131e-04 eta 17:54:37
epoch [35/50] batch [380/2000] time 2.044 (2.038) data 0.000 (0.002) loss 0.2877 (1.2049) lr 7.5131e-04 eta 17:53:46
epoch [35/50] batch [400/2000] time 2.077 (2.038) data 0.000 (0.002) loss 1.1125 (1.2056) lr 7.5131e-04 eta 17:53:17
epoch [35/50] batch [420/2000] time 2.075 (2.038) data 0.000 (0.002) loss 0.7037 (1.2134) lr 7.5131e-04 eta 17:52:44
epoch [35/50] batch [440/2000] time 2.061 (2.039) data 0.004 (0.002) loss 2.4274 (1.2033) lr 7.5131e-04 eta 17:52:19
epoch [35/50] batch [460/2000] time 2.407 (2.052) data 0.000 (0.002) loss 0.2456 (1.1886) lr 7.5131e-04 eta 17:58:34
epoch [35/50] batch [480/2000] time 2.426 (2.066) data 0.000 (0.002) loss 1.9578 (1.1811) lr 7.5131e-04 eta 18:05:29
epoch [35/50] batch [500/2000] time 1.986 (2.070) data 0.000 (0.002) loss 1.3794 (1.1790) lr 7.5131e-04 eta 18:06:57
epoch [35/50] batch [520/2000] time 2.041 (2.069) data 0.000 (0.001) loss 4.8665 (1.1949) lr 7.5131e-04 eta 18:05:44
epoch [35/50] batch [540/2000] time 2.065 (2.068) data 0.000 (0.001) loss 1.5258 (1.1936) lr 7.5131e-04 eta 18:04:29
epoch [35/50] batch [560/2000] time 2.013 (2.067) data 0.000 (0.001) loss 1.3795 (1.1905) lr 7.5131e-04 eta 18:03:17
epoch [35/50] batch [580/2000] time 2.011 (2.067) data 0.000 (0.001) loss 0.3548 (1.1782) lr 7.5131e-04 eta 18:02:16
epoch [35/50] batch [600/2000] time 2.063 (2.066) data 0.001 (0.001) loss 0.7840 (1.1821) lr 7.5131e-04 eta 18:01:12
epoch [35/50] batch [620/2000] time 2.141 (2.066) data 0.000 (0.001) loss 0.7600 (1.1799) lr 7.5131e-04 eta 18:00:21
epoch [35/50] batch [640/2000] time 2.037 (2.065) data 0.000 (0.001) loss 0.7314 (1.1661) lr 7.5131e-04 eta 17:59:19
epoch [35/50] batch [660/2000] time 2.032 (2.064) data 0.000 (0.001) loss 0.6211 (1.1622) lr 7.5131e-04 eta 17:58:14
epoch [35/50] batch [680/2000] time 2.060 (2.063) data 0.000 (0.001) loss 0.1308 (1.1665) lr 7.5131e-04 eta 17:57:08
epoch [35/50] batch [700/2000] time 2.006 (2.063) data 0.000 (0.001) loss 0.3129 (1.1626) lr 7.5131e-04 eta 17:56:06
epoch [35/50] batch [720/2000] time 2.057 (2.062) data 0.000 (0.001) loss 0.4223 (1.1593) lr 7.5131e-04 eta 17:55:03
epoch [35/50] batch [740/2000] time 2.008 (2.061) data 0.000 (0.001) loss 1.5753 (1.1632) lr 7.5131e-04 eta 17:54:00
epoch [35/50] batch [760/2000] time 2.039 (2.061) data 0.000 (0.001) loss 0.5829 (1.1670) lr 7.5131e-04 eta 17:53:02
epoch [35/50] batch [780/2000] time 2.044 (2.060) data 0.000 (0.001) loss 0.5428 (1.1614) lr 7.5131e-04 eta 17:52:03
epoch [35/50] batch [800/2000] time 2.041 (2.060) data 0.000 (0.001) loss 0.7543 (1.1662) lr 7.5131e-04 eta 17:51:08
epoch [35/50] batch [820/2000] time 2.072 (2.059) data 0.000 (0.001) loss 2.8354 (1.1659) lr 7.5131e-04 eta 17:50:07
epoch [35/50] batch [840/2000] time 2.070 (2.059) data 0.000 (0.001) loss 0.0256 (1.1664) lr 7.5131e-04 eta 17:49:16
epoch [35/50] batch [860/2000] time 2.041 (2.059) data 0.000 (0.001) loss 3.4484 (1.1758) lr 7.5131e-04 eta 17:48:29
epoch [35/50] batch [880/2000] time 2.039 (2.059) data 0.000 (0.001) loss 1.7798 (1.1671) lr 7.5131e-04 eta 17:47:43
epoch [35/50] batch [900/2000] time 2.011 (2.058) data 0.000 (0.001) loss 0.3569 (1.1678) lr 7.5131e-04 eta 17:46:51
epoch [35/50] batch [920/2000] time 2.062 (2.058) data 0.000 (0.001) loss 1.9014 (1.1741) lr 7.5131e-04 eta 17:46:00
epoch [35/50] batch [940/2000] time 1.986 (2.057) data 0.000 (0.001) loss 1.0021 (1.1762) lr 7.5131e-04 eta 17:45:05
epoch [35/50] batch [960/2000] time 2.061 (2.057) data 0.000 (0.001) loss 4.6620 (1.1795) lr 7.5131e-04 eta 17:44:12
epoch [35/50] batch [980/2000] time 2.060 (2.057) data 0.000 (0.001) loss 5.3625 (1.1798) lr 7.5131e-04 eta 17:43:17
epoch [35/50] batch [1000/2000] time 2.063 (2.056) data 0.000 (0.001) loss 0.6487 (1.1802) lr 7.5131e-04 eta 17:42:28
epoch [35/50] batch [1020/2000] time 2.065 (2.056) data 0.000 (0.001) loss 0.2438 (1.1773) lr 7.5131e-04 eta 17:41:42
epoch [35/50] batch [1040/2000] time 2.009 (2.056) data 0.000 (0.001) loss 0.3401 (1.1744) lr 7.5131e-04 eta 17:40:51
epoch [35/50] batch [1060/2000] time 2.064 (2.056) data 0.000 (0.001) loss 1.3318 (1.1749) lr 7.5131e-04 eta 17:40:02
epoch [35/50] batch [1080/2000] time 2.062 (2.055) data 0.000 (0.001) loss 0.1601 (1.1745) lr 7.5131e-04 eta 17:39:14
epoch [35/50] batch [1100/2000] time 2.038 (2.055) data 0.000 (0.001) loss 0.4102 (1.1709) lr 7.5131e-04 eta 17:38:26
epoch [35/50] batch [1120/2000] time 2.008 (2.055) data 0.000 (0.001) loss 0.5949 (1.1649) lr 7.5131e-04 eta 17:37:35
epoch [35/50] batch [1140/2000] time 2.061 (2.055) data 0.001 (0.001) loss 0.4778 (1.1627) lr 7.5131e-04 eta 17:36:48
epoch [35/50] batch [1160/2000] time 2.077 (2.055) data 0.000 (0.001) loss 1.5909 (1.1632) lr 7.5131e-04 eta 17:36:04
epoch [35/50] batch [1180/2000] time 2.052 (2.055) data 0.000 (0.001) loss 2.7302 (1.1563) lr 7.5131e-04 eta 17:35:20
epoch [35/50] batch [1200/2000] time 2.055 (2.054) data 0.000 (0.001) loss 0.5385 (1.1586) lr 7.5131e-04 eta 17:34:37
epoch [35/50] batch [1220/2000] time 2.016 (2.054) data 0.000 (0.001) loss 1.5819 (1.1558) lr 7.5131e-04 eta 17:33:51
epoch [35/50] batch [1240/2000] time 2.064 (2.054) data 0.000 (0.001) loss 1.1306 (1.1601) lr 7.5131e-04 eta 17:33:07
epoch [35/50] batch [1260/2000] time 2.019 (2.054) data 0.000 (0.001) loss 0.7050 (1.1636) lr 7.5131e-04 eta 17:32:26
epoch [35/50] batch [1280/2000] time 2.068 (2.054) data 0.001 (0.001) loss 3.4133 (1.1690) lr 7.5131e-04 eta 17:31:45
epoch [35/50] batch [1300/2000] time 2.012 (2.054) data 0.000 (0.001) loss 0.2938 (1.1663) lr 7.5131e-04 eta 17:30:58
epoch [35/50] batch [1320/2000] time 2.064 (2.054) data 0.000 (0.001) loss 0.0615 (1.1606) lr 7.5131e-04 eta 17:30:16
epoch [35/50] batch [1340/2000] time 2.078 (2.054) data 0.000 (0.001) loss 1.5466 (1.1659) lr 7.5131e-04 eta 17:29:35
epoch [35/50] batch [1360/2000] time 1.988 (2.054) data 0.000 (0.001) loss 1.0646 (1.1677) lr 7.5131e-04 eta 17:28:49
epoch [35/50] batch [1380/2000] time 2.067 (2.054) data 0.000 (0.001) loss 2.0317 (1.1750) lr 7.5131e-04 eta 17:28:04
epoch [35/50] batch [1400/2000] time 2.062 (2.054) data 0.000 (0.001) loss 1.8237 (1.1814) lr 7.5131e-04 eta 17:27:17
epoch [35/50] batch [1420/2000] time 2.062 (2.053) data 0.000 (0.001) loss 1.8225 (1.1782) lr 7.5131e-04 eta 17:26:29
epoch [35/50] batch [1440/2000] time 2.064 (2.053) data 0.000 (0.001) loss 1.3931 (1.1739) lr 7.5131e-04 eta 17:25:46
epoch [35/50] batch [1460/2000] time 2.062 (2.053) data 0.000 (0.001) loss 0.5180 (1.1708) lr 7.5131e-04 eta 17:24:57
epoch [35/50] batch [1480/2000] time 2.063 (2.053) data 0.000 (0.001) loss 2.3569 (1.1716) lr 7.5131e-04 eta 17:24:12
epoch [35/50] batch [1500/2000] time 1.990 (2.053) data 0.000 (0.001) loss 1.5348 (1.1687) lr 7.5131e-04 eta 17:23:29
epoch [35/50] batch [1520/2000] time 2.063 (2.053) data 0.000 (0.001) loss 1.1835 (1.1688) lr 7.5131e-04 eta 17:22:45
epoch [35/50] batch [1540/2000] time 2.012 (2.053) data 0.000 (0.001) loss 1.1629 (1.1697) lr 7.5131e-04 eta 17:22:01
epoch [35/50] batch [1560/2000] time 2.066 (2.052) data 0.000 (0.001) loss 0.4930 (1.1723) lr 7.5131e-04 eta 17:21:17
epoch [35/50] batch [1580/2000] time 2.011 (2.052) data 0.000 (0.001) loss 2.0339 (1.1708) lr 7.5131e-04 eta 17:20:29
epoch [35/50] batch [1600/2000] time 2.063 (2.052) data 0.000 (0.001) loss 0.2715 (1.1701) lr 7.5131e-04 eta 17:19:46
epoch [35/50] batch [1620/2000] time 2.012 (2.052) data 0.000 (0.001) loss 1.3061 (1.1717) lr 7.5131e-04 eta 17:19:02
epoch [35/50] batch [1640/2000] time 2.059 (2.052) data 0.000 (0.001) loss 0.3832 (1.1684) lr 7.5131e-04 eta 17:18:17
epoch [35/50] batch [1660/2000] time 2.070 (2.052) data 0.000 (0.001) loss 0.4632 (1.1695) lr 7.5131e-04 eta 17:17:37
epoch [35/50] batch [1680/2000] time 2.044 (2.052) data 0.001 (0.001) loss 0.2250 (1.1698) lr 7.5131e-04 eta 17:16:55
epoch [35/50] batch [1700/2000] time 2.014 (2.052) data 0.000 (0.001) loss 3.7651 (1.1724) lr 7.5131e-04 eta 17:16:10
epoch [35/50] batch [1720/2000] time 2.038 (2.052) data 0.000 (0.001) loss 0.6390 (1.1693) lr 7.5131e-04 eta 17:15:27
epoch [35/50] batch [1740/2000] time 2.049 (2.052) data 0.000 (0.001) loss 1.5976 (1.1698) lr 7.5131e-04 eta 17:14:44
epoch [35/50] batch [1760/2000] time 2.068 (2.052) data 0.000 (0.001) loss 1.2440 (1.1697) lr 7.5131e-04 eta 17:14:05
epoch [35/50] batch [1780/2000] time 2.071 (2.052) data 0.000 (0.001) loss 0.8948 (1.1738) lr 7.5131e-04 eta 17:13:19
epoch [35/50] batch [1800/2000] time 2.011 (2.052) data 0.000 (0.001) loss 3.0938 (1.1759) lr 7.5131e-04 eta 17:12:35
epoch [35/50] batch [1820/2000] time 2.020 (2.051) data 0.000 (0.001) loss 0.7977 (1.1760) lr 7.5131e-04 eta 17:11:50
epoch [35/50] batch [1840/2000] time 2.012 (2.051) data 0.000 (0.001) loss 0.8919 (1.1788) lr 7.5131e-04 eta 17:11:10
epoch [35/50] batch [1860/2000] time 2.008 (2.051) data 0.000 (0.001) loss 3.4990 (1.1764) lr 7.5131e-04 eta 17:10:24
epoch [35/50] batch [1880/2000] time 2.030 (2.051) data 0.000 (0.001) loss 0.4781 (1.1738) lr 7.5131e-04 eta 17:09:45
epoch [35/50] batch [1900/2000] time 2.066 (2.051) data 0.000 (0.001) loss 0.0705 (1.1747) lr 7.5131e-04 eta 17:09:06
epoch [35/50] batch [1920/2000] time 2.071 (2.051) data 0.000 (0.001) loss 1.3989 (1.1725) lr 7.5131e-04 eta 17:08:24
epoch [35/50] batch [1940/2000] time 2.043 (2.051) data 0.000 (0.001) loss 1.2453 (1.1683) lr 7.5131e-04 eta 17:07:44
epoch [35/50] batch [1960/2000] time 2.078 (2.051) data 0.000 (0.001) loss 0.9456 (1.1722) lr 7.5131e-04 eta 17:07:01
epoch [35/50] batch [1980/2000] time 2.038 (2.051) data 0.000 (0.001) loss 1.7691 (1.1763) lr 7.5131e-04 eta 17:06:18
epoch [35/50] batch [2000/2000] time 2.038 (2.051) data 0.000 (0.001) loss 3.2825 (1.1774) lr 6.9098e-04 eta 17:05:35
epoch [36/50] batch [20/2000] time 2.072 (2.089) data 0.000 (0.040) loss 0.3392 (1.3939) lr 6.9098e-04 eta 17:23:44
epoch [36/50] batch [40/2000] time 1.987 (2.064) data 0.000 (0.020) loss 1.9847 (1.3259) lr 6.9098e-04 eta 17:10:32
epoch [36/50] batch [60/2000] time 2.051 (2.059) data 0.001 (0.014) loss 0.9675 (1.3336) lr 6.9098e-04 eta 17:07:17
epoch [36/50] batch [80/2000] time 2.041 (2.054) data 0.000 (0.010) loss 1.7823 (1.2939) lr 6.9098e-04 eta 17:04:11
epoch [36/50] batch [100/2000] time 2.067 (2.051) data 0.000 (0.008) loss 1.1120 (1.2474) lr 6.9098e-04 eta 17:02:09
epoch [36/50] batch [120/2000] time 2.067 (2.049) data 0.000 (0.007) loss 0.7091 (1.1988) lr 6.9098e-04 eta 17:00:35
epoch [36/50] batch [140/2000] time 2.063 (2.049) data 0.000 (0.006) loss 0.4911 (1.2325) lr 6.9098e-04 eta 16:59:41
epoch [36/50] batch [160/2000] time 2.045 (2.047) data 0.000 (0.005) loss 1.1693 (1.2371) lr 6.9098e-04 eta 16:58:04
epoch [36/50] batch [180/2000] time 2.070 (2.047) data 0.000 (0.005) loss 0.2266 (1.2278) lr 6.9098e-04 eta 16:57:12
epoch [36/50] batch [200/2000] time 2.066 (2.047) data 0.005 (0.004) loss 0.7486 (1.2077) lr 6.9098e-04 eta 16:56:46
epoch [36/50] batch [220/2000] time 2.012 (2.047) data 0.000 (0.004) loss 0.8141 (1.1907) lr 6.9098e-04 eta 16:56:08
epoch [36/50] batch [240/2000] time 2.066 (2.047) data 0.000 (0.004) loss 0.8114 (1.1841) lr 6.9098e-04 eta 16:55:13
epoch [36/50] batch [260/2000] time 2.006 (2.047) data 0.000 (0.003) loss 1.2898 (1.2070) lr 6.9098e-04 eta 16:54:25
epoch [36/50] batch [280/2000] time 2.010 (2.046) data 0.000 (0.003) loss 0.3834 (1.1802) lr 6.9098e-04 eta 16:53:25
epoch [36/50] batch [300/2000] time 2.063 (2.046) data 0.000 (0.003) loss 1.7428 (1.1610) lr 6.9098e-04 eta 16:52:46
epoch [36/50] batch [320/2000] time 2.006 (2.046) data 0.000 (0.003) loss 1.6074 (1.1699) lr 6.9098e-04 eta 16:51:57
epoch [36/50] batch [340/2000] time 2.046 (2.045) data 0.000 (0.003) loss 0.0117 (1.1730) lr 6.9098e-04 eta 16:50:55
epoch [36/50] batch [360/2000] time 2.045 (2.045) data 0.000 (0.003) loss 0.1930 (1.1853) lr 6.9098e-04 eta 16:50:11
epoch [36/50] batch [380/2000] time 2.014 (2.045) data 0.000 (0.003) loss 0.9718 (1.1958) lr 6.9098e-04 eta 16:49:26
epoch [36/50] batch [400/2000] time 2.065 (2.045) data 0.000 (0.002) loss 1.4747 (1.1777) lr 6.9098e-04 eta 16:48:38
epoch [36/50] batch [420/2000] time 2.069 (2.044) data 0.000 (0.002) loss 0.3149 (1.1711) lr 6.9098e-04 eta 16:47:50
epoch [36/50] batch [440/2000] time 2.073 (2.045) data 0.000 (0.002) loss 1.0435 (1.1632) lr 6.9098e-04 eta 16:47:19
epoch [36/50] batch [460/2000] time 2.025 (2.045) data 0.000 (0.002) loss 2.3118 (1.1653) lr 6.9098e-04 eta 16:46:41
epoch [36/50] batch [480/2000] time 2.042 (2.045) data 0.000 (0.002) loss 0.7854 (1.1748) lr 6.9098e-04 eta 16:46:01
epoch [36/50] batch [500/2000] time 2.044 (2.045) data 0.000 (0.002) loss 0.7192 (1.1670) lr 6.9098e-04 eta 16:45:24
epoch [36/50] batch [520/2000] time 2.041 (2.045) data 0.000 (0.002) loss 2.8115 (1.1679) lr 6.9098e-04 eta 16:44:44
epoch [36/50] batch [540/2000] time 2.066 (2.045) data 0.000 (0.002) loss 0.2620 (1.1703) lr 6.9098e-04 eta 16:44:05
epoch [36/50] batch [560/2000] time 2.018 (2.045) data 0.000 (0.002) loss 1.6376 (1.1648) lr 6.9098e-04 eta 16:43:33
epoch [36/50] batch [580/2000] time 2.041 (2.045) data 0.000 (0.002) loss 1.1082 (1.1585) lr 6.9098e-04 eta 16:42:50
epoch [36/50] batch [600/2000] time 2.067 (2.045) data 0.001 (0.002) loss 1.0145 (1.1601) lr 6.9098e-04 eta 16:42:08
epoch [36/50] batch [620/2000] time 2.042 (2.046) data 0.000 (0.002) loss 1.1500 (1.1587) lr 6.9098e-04 eta 16:41:37
epoch [36/50] batch [640/2000] time 2.070 (2.046) data 0.000 (0.002) loss 0.0742 (1.1597) lr 6.9098e-04 eta 16:40:56
epoch [36/50] batch [660/2000] time 2.012 (2.045) data 0.000 (0.002) loss 1.7723 (1.1597) lr 6.9098e-04 eta 16:40:11
epoch [36/50] batch [680/2000] time 2.066 (2.045) data 0.000 (0.002) loss 0.7033 (1.1596) lr 6.9098e-04 eta 16:39:30
epoch [36/50] batch [700/2000] time 2.012 (2.045) data 0.000 (0.002) loss 0.5770 (1.1773) lr 6.9098e-04 eta 16:38:46
epoch [36/50] batch [720/2000] time 2.016 (2.045) data 0.000 (0.001) loss 0.5001 (1.1850) lr 6.9098e-04 eta 16:38:06
epoch [36/50] batch [740/2000] time 2.068 (2.045) data 0.000 (0.001) loss 1.7675 (1.1823) lr 6.9098e-04 eta 16:37:26
epoch [36/50] batch [760/2000] time 2.039 (2.045) data 0.000 (0.001) loss 0.3127 (1.1923) lr 6.9098e-04 eta 16:36:46
epoch [36/50] batch [780/2000] time 2.068 (2.045) data 0.000 (0.001) loss 1.4249 (1.1988) lr 6.9098e-04 eta 16:36:01
epoch [36/50] batch [800/2000] time 2.067 (2.045) data 0.000 (0.001) loss 1.0481 (1.1994) lr 6.9098e-04 eta 16:35:17
epoch [36/50] batch [820/2000] time 2.067 (2.045) data 0.000 (0.001) loss 1.3407 (1.2097) lr 6.9098e-04 eta 16:34:31
epoch [36/50] batch [840/2000] time 2.017 (2.045) data 0.000 (0.001) loss 1.7647 (1.2083) lr 6.9098e-04 eta 16:33:47
epoch [36/50] batch [860/2000] time 2.068 (2.045) data 0.000 (0.001) loss 0.2956 (1.2028) lr 6.9098e-04 eta 16:33:07
epoch [36/50] batch [880/2000] time 2.067 (2.045) data 0.000 (0.001) loss 0.7265 (1.2030) lr 6.9098e-04 eta 16:32:24
epoch [36/50] batch [900/2000] time 2.066 (2.045) data 0.000 (0.001) loss 0.9680 (1.1951) lr 6.9098e-04 eta 16:31:46
epoch [36/50] batch [920/2000] time 2.036 (2.045) data 0.000 (0.001) loss 2.3707 (1.1960) lr 6.9098e-04 eta 16:31:03
epoch [36/50] batch [940/2000] time 2.009 (2.045) data 0.000 (0.001) loss 0.2092 (1.1953) lr 6.9098e-04 eta 16:30:20
epoch [36/50] batch [960/2000] time 2.039 (2.045) data 0.000 (0.001) loss 1.3967 (1.1897) lr 6.9098e-04 eta 16:29:35
epoch [36/50] batch [980/2000] time 2.005 (2.044) data 0.000 (0.001) loss 3.8799 (1.1950) lr 6.9098e-04 eta 16:28:49
epoch [36/50] batch [1000/2000] time 2.040 (2.044) data 0.000 (0.001) loss 0.6466 (1.1927) lr 6.9098e-04 eta 16:28:06
epoch [36/50] batch [1020/2000] time 2.066 (2.044) data 0.000 (0.001) loss 0.9721 (1.1885) lr 6.9098e-04 eta 16:27:26
epoch [36/50] batch [1040/2000] time 2.038 (2.044) data 0.000 (0.001) loss 0.4362 (1.1882) lr 6.9098e-04 eta 16:26:43
epoch [36/50] batch [1060/2000] time 2.064 (2.044) data 0.000 (0.001) loss 1.4414 (1.1898) lr 6.9098e-04 eta 16:26:01
epoch [36/50] batch [1080/2000] time 2.011 (2.044) data 0.000 (0.001) loss 1.0613 (1.1866) lr 6.9098e-04 eta 16:25:18
epoch [36/50] batch [1100/2000] time 2.016 (2.044) data 0.000 (0.001) loss 3.3849 (1.1918) lr 6.9098e-04 eta 16:24:36
epoch [36/50] batch [1120/2000] time 2.042 (2.044) data 0.000 (0.001) loss 1.3957 (1.1941) lr 6.9098e-04 eta 16:23:53
epoch [36/50] batch [1140/2000] time 2.073 (2.044) data 0.001 (0.001) loss 0.3278 (1.1946) lr 6.9098e-04 eta 16:23:12
epoch [36/50] batch [1160/2000] time 2.007 (2.044) data 0.001 (0.001) loss 1.8931 (1.1913) lr 6.9098e-04 eta 16:22:34
epoch [36/50] batch [1180/2000] time 2.033 (2.044) data 0.000 (0.001) loss 1.3591 (1.1955) lr 6.9098e-04 eta 16:21:51
epoch [36/50] batch [1200/2000] time 2.052 (2.044) data 0.000 (0.001) loss 1.0575 (1.1915) lr 6.9098e-04 eta 16:21:11
epoch [36/50] batch [1220/2000] time 1.975 (2.044) data 0.000 (0.001) loss 1.6487 (1.1905) lr 6.9098e-04 eta 16:20:22
epoch [36/50] batch [1240/2000] time 2.034 (2.044) data 0.000 (0.001) loss 1.3938 (1.1881) lr 6.9098e-04 eta 16:19:36
epoch [36/50] batch [1260/2000] time 2.031 (2.044) data 0.000 (0.001) loss 1.5253 (1.1875) lr 6.9098e-04 eta 16:18:51
epoch [36/50] batch [1280/2000] time 2.056 (2.043) data 0.000 (0.001) loss 4.4709 (1.1895) lr 6.9098e-04 eta 16:18:06
epoch [36/50] batch [1300/2000] time 2.059 (2.043) data 0.000 (0.001) loss 1.7044 (1.1879) lr 6.9098e-04 eta 16:17:22
epoch [36/50] batch [1320/2000] time 1.982 (2.043) data 0.000 (0.001) loss 0.4207 (1.1919) lr 6.9098e-04 eta 16:16:35
epoch [36/50] batch [1340/2000] time 1.976 (2.043) data 0.000 (0.001) loss 1.9403 (1.1946) lr 6.9098e-04 eta 16:15:51
epoch [36/50] batch [1360/2000] time 2.034 (2.043) data 0.000 (0.001) loss 4.2673 (1.1908) lr 6.9098e-04 eta 16:15:09
epoch [36/50] batch [1380/2000] time 2.036 (2.043) data 0.000 (0.001) loss 0.5980 (1.1890) lr 6.9098e-04 eta 16:14:26
epoch [36/50] batch [1400/2000] time 2.005 (2.043) data 0.000 (0.001) loss 1.8926 (1.1840) lr 6.9098e-04 eta 16:13:39
epoch [36/50] batch [1420/2000] time 2.057 (2.043) data 0.000 (0.001) loss 2.0127 (1.1851) lr 6.9098e-04 eta 16:12:55
epoch [36/50] batch [1440/2000] time 2.008 (2.043) data 0.000 (0.001) loss 0.1565 (1.1815) lr 6.9098e-04 eta 16:12:14
epoch [36/50] batch [1460/2000] time 2.039 (2.043) data 0.000 (0.001) loss 0.9266 (1.1834) lr 6.9098e-04 eta 16:11:35
epoch [36/50] batch [1480/2000] time 2.055 (2.043) data 0.001 (0.001) loss 0.2946 (1.1854) lr 6.9098e-04 eta 16:10:58
epoch [36/50] batch [1500/2000] time 2.058 (2.043) data 0.000 (0.001) loss 0.2577 (1.1852) lr 6.9098e-04 eta 16:10:21
epoch [36/50] batch [1520/2000] time 2.013 (2.043) data 0.000 (0.001) loss 0.9237 (1.1875) lr 6.9098e-04 eta 16:09:40
epoch [36/50] batch [1540/2000] time 2.040 (2.043) data 0.000 (0.001) loss 0.6106 (1.1879) lr 6.9098e-04 eta 16:09:02
epoch [36/50] batch [1560/2000] time 2.064 (2.043) data 0.000 (0.001) loss 1.1406 (1.1871) lr 6.9098e-04 eta 16:08:20
epoch [36/50] batch [1580/2000] time 2.063 (2.043) data 0.000 (0.001) loss 1.4676 (1.1827) lr 6.9098e-04 eta 16:07:40
epoch [36/50] batch [1600/2000] time 2.006 (2.043) data 0.000 (0.001) loss 0.1010 (1.1818) lr 6.9098e-04 eta 16:06:59
epoch [36/50] batch [1620/2000] time 2.045 (2.043) data 0.000 (0.001) loss 1.9353 (1.1777) lr 6.9098e-04 eta 16:06:21
epoch [36/50] batch [1640/2000] time 2.005 (2.043) data 0.000 (0.001) loss 0.7376 (1.1745) lr 6.9098e-04 eta 16:05:40
epoch [36/50] batch [1660/2000] time 2.062 (2.043) data 0.000 (0.001) loss 0.1975 (1.1711) lr 6.9098e-04 eta 16:04:57
epoch [36/50] batch [1680/2000] time 2.065 (2.043) data 0.000 (0.001) loss 1.9489 (1.1744) lr 6.9098e-04 eta 16:04:17
epoch [36/50] batch [1700/2000] time 2.070 (2.043) data 0.000 (0.001) loss 1.6328 (1.1736) lr 6.9098e-04 eta 16:03:41
epoch [36/50] batch [1720/2000] time 2.073 (2.043) data 0.000 (0.001) loss 0.5262 (1.1693) lr 6.9098e-04 eta 16:03:02
epoch [36/50] batch [1740/2000] time 2.060 (2.043) data 0.000 (0.001) loss 2.3197 (1.1704) lr 6.9098e-04 eta 16:02:27
epoch [36/50] batch [1760/2000] time 2.060 (2.044) data 0.000 (0.001) loss 0.0165 (1.1676) lr 6.9098e-04 eta 16:01:51
epoch [36/50] batch [1780/2000] time 2.081 (2.044) data 0.000 (0.001) loss 2.8089 (1.1643) lr 6.9098e-04 eta 16:01:25
epoch [36/50] batch [1800/2000] time 2.006 (2.044) data 0.000 (0.001) loss 2.6094 (1.1643) lr 6.9098e-04 eta 16:00:47
epoch [36/50] batch [1820/2000] time 2.066 (2.044) data 0.003 (0.001) loss 0.6492 (1.1624) lr 6.9098e-04 eta 16:00:05
epoch [36/50] batch [1840/2000] time 2.065 (2.044) data 0.000 (0.001) loss 3.4511 (1.1625) lr 6.9098e-04 eta 15:59:25
epoch [36/50] batch [1860/2000] time 2.053 (2.044) data 0.000 (0.001) loss 1.7176 (1.1641) lr 6.9098e-04 eta 15:58:48
epoch [36/50] batch [1880/2000] time 2.059 (2.045) data 0.001 (0.001) loss 1.4402 (1.1608) lr 6.9098e-04 eta 15:58:13
epoch [36/50] batch [1900/2000] time 2.010 (2.045) data 0.000 (0.001) loss 0.0688 (1.1641) lr 6.9098e-04 eta 15:57:34
epoch [36/50] batch [1920/2000] time 2.073 (2.045) data 0.000 (0.001) loss 0.9487 (1.1631) lr 6.9098e-04 eta 15:56:53
epoch [36/50] batch [1940/2000] time 2.053 (2.045) data 0.000 (0.001) loss 0.7895 (1.1629) lr 6.9098e-04 eta 15:56:14
epoch [36/50] batch [1960/2000] time 2.424 (2.046) data 0.000 (0.001) loss 3.8463 (1.1642) lr 6.9098e-04 eta 15:56:01
epoch [36/50] batch [1980/2000] time 2.417 (2.049) data 0.000 (0.001) loss 0.0503 (1.1696) lr 6.9098e-04 eta 15:57:03
epoch [36/50] batch [2000/2000] time 2.363 (2.053) data 0.000 (0.001) loss 1.0128 (1.1712) lr 6.3188e-04 eta 15:58:06
epoch [37/50] batch [20/2000] time 2.432 (2.452) data 0.001 (0.035) loss 0.6165 (1.0996) lr 6.3188e-04 eta 19:03:38
epoch [37/50] batch [40/2000] time 2.388 (2.434) data 0.005 (0.018) loss 0.5893 (1.2953) lr 6.3188e-04 eta 18:54:14
epoch [37/50] batch [60/2000] time 2.467 (2.435) data 0.010 (0.012) loss 0.3801 (1.1971) lr 6.3188e-04 eta 18:53:59
epoch [37/50] batch [80/2000] time 2.474 (2.439) data 0.000 (0.010) loss 0.5282 (1.1517) lr 6.3188e-04 eta 18:55:04
epoch [37/50] batch [100/2000] time 2.365 (2.437) data 0.000 (0.008) loss 0.1141 (1.1665) lr 6.3188e-04 eta 18:53:07
epoch [37/50] batch [120/2000] time 2.439 (2.434) data 0.001 (0.007) loss 0.3467 (1.2379) lr 6.3188e-04 eta 18:51:00
epoch [37/50] batch [140/2000] time 2.365 (2.432) data 0.000 (0.006) loss 1.8983 (1.2477) lr 6.3188e-04 eta 18:49:07
epoch [37/50] batch [160/2000] time 2.425 (2.430) data 0.000 (0.005) loss 0.9361 (1.2456) lr 6.3188e-04 eta 18:47:24
epoch [37/50] batch [180/2000] time 2.435 (2.430) data 0.000 (0.005) loss 3.4097 (1.2667) lr 6.3188e-04 eta 18:46:39
epoch [37/50] batch [200/2000] time 2.412 (2.428) data 0.000 (0.004) loss 0.6472 (1.2368) lr 6.3188e-04 eta 18:44:58
epoch [37/50] batch [220/2000] time 2.444 (2.426) data 0.004 (0.004) loss 0.7097 (1.2642) lr 6.3188e-04 eta 18:43:06
epoch [37/50] batch [240/2000] time 2.449 (2.426) data 0.000 (0.004) loss 1.3660 (1.2492) lr 6.3188e-04 eta 18:42:15
epoch [37/50] batch [260/2000] time 2.393 (2.425) data 0.000 (0.003) loss 1.7704 (1.2405) lr 6.3188e-04 eta 18:40:59
epoch [37/50] batch [280/2000] time 2.438 (2.425) data 0.000 (0.003) loss 2.0176 (1.2433) lr 6.3188e-04 eta 18:40:26
epoch [37/50] batch [300/2000] time 2.443 (2.424) data 0.000 (0.003) loss 1.1800 (1.2025) lr 6.3188e-04 eta 18:39:17
epoch [37/50] batch [320/2000] time 2.473 (2.424) data 0.000 (0.003) loss 1.7087 (1.2012) lr 6.3188e-04 eta 18:38:28
epoch [37/50] batch [340/2000] time 2.389 (2.424) data 0.000 (0.003) loss 0.4353 (1.2165) lr 6.3188e-04 eta 18:37:29
epoch [37/50] batch [360/2000] time 2.389 (2.424) data 0.000 (0.003) loss 1.5554 (1.2197) lr 6.3188e-04 eta 18:36:28
epoch [37/50] batch [380/2000] time 2.385 (2.423) data 0.000 (0.002) loss 1.4840 (1.2180) lr 6.3188e-04 eta 18:35:22
epoch [37/50] batch [400/2000] time 2.437 (2.422) data 0.000 (0.002) loss 0.5699 (1.2181) lr 6.3188e-04 eta 18:34:11
epoch [37/50] batch [420/2000] time 2.875 (2.423) data 0.000 (0.002) loss 3.1094 (1.2332) lr 6.3188e-04 eta 18:33:56
epoch [37/50] batch [440/2000] time 2.914 (2.445) data 0.000 (0.002) loss 1.9575 (1.2316) lr 6.3188e-04 eta 18:43:17
epoch [37/50] batch [460/2000] time 2.415 (2.466) data 0.000 (0.002) loss 0.8510 (1.2272) lr 6.3188e-04 eta 18:51:46
epoch [37/50] batch [480/2000] time 2.753 (2.484) data 0.012 (0.002) loss 3.0766 (1.2205) lr 6.3188e-04 eta 18:59:21
epoch [37/50] batch [500/2000] time 2.838 (2.499) data 0.000 (0.002) loss 1.0103 (1.2350) lr 6.3188e-04 eta 19:05:34
epoch [37/50] batch [520/2000] time 3.017 (2.515) data 0.000 (0.002) loss 0.1927 (1.2412) lr 6.3188e-04 eta 19:11:56
epoch [37/50] batch [540/2000] time 3.067 (2.529) data 0.000 (0.002) loss 0.0461 (1.2403) lr 6.3188e-04 eta 19:17:37
epoch [37/50] batch [560/2000] time 2.382 (2.543) data 0.000 (0.002) loss 0.5957 (1.2403) lr 6.3188e-04 eta 19:22:46
epoch [37/50] batch [580/2000] time 2.040 (2.554) data 0.006 (0.002) loss 1.5809 (1.2378) lr 6.3188e-04 eta 19:26:58
epoch [37/50] batch [600/2000] time 2.003 (2.537) data 0.001 (0.002) loss 0.3584 (1.2491) lr 6.3188e-04 eta 19:18:29
epoch [37/50] batch [620/2000] time 2.070 (2.521) data 0.000 (0.002) loss 1.9430 (1.2546) lr 6.3188e-04 eta 19:10:24
epoch [37/50] batch [640/2000] time 2.017 (2.506) data 0.000 (0.002) loss 1.2230 (1.2555) lr 6.3188e-04 eta 19:02:54
epoch [37/50] batch [660/2000] time 2.067 (2.493) data 0.000 (0.002) loss 0.3462 (1.2542) lr 6.3188e-04 eta 18:55:51
epoch [37/50] batch [680/2000] time 2.058 (2.479) data 0.000 (0.002) loss 1.1845 (1.2477) lr 6.3188e-04 eta 18:48:57
epoch [37/50] batch [700/2000] time 1.997 (2.467) data 0.000 (0.002) loss 3.2425 (1.2614) lr 6.3188e-04 eta 18:42:29
epoch [37/50] batch [720/2000] time 2.096 (2.455) data 0.001 (0.002) loss 1.5475 (1.2619) lr 6.3188e-04 eta 18:36:15
epoch [37/50] batch [740/2000] time 2.054 (2.444) data 0.000 (0.002) loss 0.1933 (1.2546) lr 6.3188e-04 eta 18:30:35
epoch [37/50] batch [760/2000] time 2.019 (2.435) data 0.000 (0.002) loss 2.0447 (1.2493) lr 6.3188e-04 eta 18:25:18
epoch [37/50] batch [780/2000] time 2.033 (2.424) data 0.000 (0.001) loss 0.1246 (1.2381) lr 6.3188e-04 eta 18:19:54
epoch [37/50] batch [800/2000] time 2.035 (2.415) data 0.000 (0.001) loss 0.4427 (1.2285) lr 6.3188e-04 eta 18:14:44
epoch [37/50] batch [820/2000] time 2.054 (2.406) data 0.000 (0.001) loss 1.5505 (1.2355) lr 6.3188e-04 eta 18:09:47
epoch [37/50] batch [840/2000] time 2.041 (2.397) data 0.000 (0.001) loss 0.2672 (1.2226) lr 6.3188e-04 eta 18:05:05
epoch [37/50] batch [860/2000] time 2.002 (2.389) data 0.000 (0.001) loss 0.6765 (1.2227) lr 6.3188e-04 eta 18:00:33
epoch [37/50] batch [880/2000] time 2.115 (2.382) data 0.000 (0.001) loss 0.2178 (1.2216) lr 6.3188e-04 eta 17:56:36
epoch [37/50] batch [900/2000] time 2.003 (2.374) data 0.000 (0.001) loss 0.9485 (1.2259) lr 6.3188e-04 eta 17:52:28
epoch [37/50] batch [920/2000] time 2.012 (2.368) data 0.000 (0.001) loss 1.3163 (1.2225) lr 6.3188e-04 eta 17:48:35
epoch [37/50] batch [940/2000] time 2.041 (2.361) data 0.000 (0.001) loss 0.3783 (1.2169) lr 6.3188e-04 eta 17:44:48
epoch [37/50] batch [960/2000] time 2.000 (2.354) data 0.000 (0.001) loss 0.1342 (1.2094) lr 6.3188e-04 eta 17:41:03
epoch [37/50] batch [980/2000] time 1.982 (2.348) data 0.000 (0.001) loss 2.7811 (1.2071) lr 6.3188e-04 eta 17:37:25
epoch [37/50] batch [1000/2000] time 2.063 (2.342) data 0.000 (0.001) loss 2.5779 (1.2050) lr 6.3188e-04 eta 17:33:59
epoch [37/50] batch [1020/2000] time 2.061 (2.336) data 0.000 (0.001) loss 0.1155 (1.2009) lr 6.3188e-04 eta 17:30:35
epoch [37/50] batch [1040/2000] time 2.066 (2.331) data 0.000 (0.001) loss 0.4710 (1.1999) lr 6.3188e-04 eta 17:27:20
epoch [37/50] batch [1060/2000] time 2.027 (2.326) data 0.000 (0.001) loss 1.0774 (1.1985) lr 6.3188e-04 eta 17:24:16
epoch [37/50] batch [1080/2000] time 2.003 (2.321) data 0.000 (0.001) loss 0.9261 (1.2044) lr 6.3188e-04 eta 17:21:15
epoch [37/50] batch [1100/2000] time 2.033 (2.316) data 0.000 (0.001) loss 1.7176 (1.2047) lr 6.3188e-04 eta 17:18:16
epoch [37/50] batch [1120/2000] time 2.052 (2.311) data 0.000 (0.001) loss 1.5340 (1.2090) lr 6.3188e-04 eta 17:15:19
epoch [37/50] batch [1140/2000] time 2.073 (2.306) data 0.001 (0.001) loss 1.5559 (1.2104) lr 6.3188e-04 eta 17:12:26
epoch [37/50] batch [1160/2000] time 2.045 (2.302) data 0.000 (0.001) loss 1.4805 (1.2076) lr 6.3188e-04 eta 17:09:33
epoch [37/50] batch [1180/2000] time 2.003 (2.297) data 0.000 (0.001) loss 0.0872 (1.2058) lr 6.3188e-04 eta 17:06:53
epoch [37/50] batch [1200/2000] time 2.070 (2.293) data 0.000 (0.001) loss 2.4690 (1.2103) lr 6.3188e-04 eta 17:04:21
epoch [37/50] batch [1220/2000] time 2.066 (2.290) data 0.001 (0.001) loss 0.8882 (1.2091) lr 6.3188e-04 eta 17:01:54
epoch [37/50] batch [1240/2000] time 2.014 (2.285) data 0.000 (0.001) loss 0.2054 (1.2078) lr 6.3188e-04 eta 16:59:18
epoch [37/50] batch [1260/2000] time 2.057 (2.281) data 0.000 (0.001) loss 2.1734 (1.2041) lr 6.3188e-04 eta 16:56:46
epoch [37/50] batch [1280/2000] time 2.006 (2.278) data 0.000 (0.001) loss 1.0261 (1.2034) lr 6.3188e-04 eta 16:54:18
epoch [37/50] batch [1300/2000] time 2.004 (2.274) data 0.000 (0.001) loss 1.2080 (1.1997) lr 6.3188e-04 eta 16:51:54
epoch [37/50] batch [1320/2000] time 2.054 (2.270) data 0.000 (0.001) loss 2.7592 (1.1978) lr 6.3188e-04 eta 16:49:34
epoch [37/50] batch [1340/2000] time 2.030 (2.267) data 0.000 (0.001) loss 0.3605 (1.2010) lr 6.3188e-04 eta 16:47:16
epoch [37/50] batch [1360/2000] time 2.035 (2.264) data 0.000 (0.001) loss 5.1697 (1.2040) lr 6.3188e-04 eta 16:45:03
epoch [37/50] batch [1380/2000] time 2.045 (2.261) data 0.000 (0.001) loss 1.5078 (1.2059) lr 6.3188e-04 eta 16:43:02
epoch [37/50] batch [1400/2000] time 2.053 (2.258) data 0.000 (0.001) loss 2.0345 (1.2055) lr 6.3188e-04 eta 16:40:52
epoch [37/50] batch [1420/2000] time 2.052 (2.255) data 0.000 (0.001) loss 1.3316 (1.2019) lr 6.3188e-04 eta 16:38:46
epoch [37/50] batch [1440/2000] time 2.068 (2.252) data 0.000 (0.001) loss 0.3365 (1.2045) lr 6.3188e-04 eta 16:36:44
epoch [37/50] batch [1460/2000] time 2.060 (2.249) data 0.000 (0.001) loss 1.1350 (1.2033) lr 6.3188e-04 eta 16:34:40
epoch [37/50] batch [1480/2000] time 2.069 (2.246) data 0.000 (0.001) loss 1.4376 (1.2069) lr 6.3188e-04 eta 16:32:46
epoch [37/50] batch [1500/2000] time 2.156 (2.244) data 0.000 (0.001) loss 2.2142 (1.2051) lr 6.3188e-04 eta 16:30:53
epoch [37/50] batch [1520/2000] time 2.048 (2.241) data 0.000 (0.001) loss 1.4146 (1.2024) lr 6.3188e-04 eta 16:28:56
epoch [37/50] batch [1540/2000] time 2.073 (2.238) data 0.000 (0.001) loss 0.8340 (1.1994) lr 6.3188e-04 eta 16:27:05
epoch [37/50] batch [1560/2000] time 2.058 (2.236) data 0.000 (0.001) loss 2.6009 (1.1994) lr 6.3188e-04 eta 16:25:16
epoch [37/50] batch [1580/2000] time 2.021 (2.233) data 0.000 (0.001) loss 0.1231 (1.1977) lr 6.3188e-04 eta 16:23:26
epoch [37/50] batch [1600/2000] time 2.106 (2.231) data 0.000 (0.001) loss 0.4258 (1.1951) lr 6.3188e-04 eta 16:21:40
epoch [37/50] batch [1620/2000] time 2.018 (2.229) data 0.000 (0.001) loss 1.6170 (1.1965) lr 6.3188e-04 eta 16:19:56
epoch [37/50] batch [1640/2000] time 2.009 (2.227) data 0.000 (0.001) loss 2.1546 (1.1970) lr 6.3188e-04 eta 16:18:15
epoch [37/50] batch [1660/2000] time 2.070 (2.225) data 0.000 (0.001) loss 1.2072 (1.1961) lr 6.3188e-04 eta 16:16:35
epoch [37/50] batch [1680/2000] time 2.012 (2.222) data 0.001 (0.001) loss 0.8475 (1.1934) lr 6.3188e-04 eta 16:14:54
epoch [37/50] batch [1700/2000] time 2.070 (2.221) data 0.000 (0.001) loss 0.3652 (1.1952) lr 6.3188e-04 eta 16:13:19
epoch [37/50] batch [1720/2000] time 2.008 (2.219) data 0.000 (0.001) loss 0.1967 (1.1969) lr 6.3188e-04 eta 16:11:45
epoch [37/50] batch [1740/2000] time 2.067 (2.217) data 0.000 (0.001) loss 1.6723 (1.1965) lr 6.3188e-04 eta 16:10:08
epoch [37/50] batch [1760/2000] time 2.022 (2.215) data 0.005 (0.001) loss 1.1489 (1.1921) lr 6.3188e-04 eta 16:08:46
epoch [37/50] batch [1780/2000] time 2.064 (2.214) data 0.000 (0.001) loss 0.0358 (1.1951) lr 6.3188e-04 eta 16:07:19
epoch [37/50] batch [1800/2000] time 2.041 (2.212) data 0.000 (0.001) loss 2.9924 (1.1973) lr 6.3188e-04 eta 16:05:45
epoch [37/50] batch [1820/2000] time 2.067 (2.210) data 0.000 (0.001) loss 1.2336 (1.1943) lr 6.3188e-04 eta 16:04:13
epoch [37/50] batch [1840/2000] time 2.006 (2.208) data 0.000 (0.001) loss 2.3083 (1.1949) lr 6.3188e-04 eta 16:02:44
epoch [37/50] batch [1860/2000] time 2.060 (2.206) data 0.000 (0.001) loss 2.2634 (1.1982) lr 6.3188e-04 eta 16:01:15
epoch [37/50] batch [1880/2000] time 2.019 (2.205) data 0.000 (0.001) loss 0.1245 (1.1950) lr 6.3188e-04 eta 15:59:48
epoch [37/50] batch [1900/2000] time 2.048 (2.203) data 0.000 (0.001) loss 1.2220 (1.1986) lr 6.3188e-04 eta 15:58:24
epoch [37/50] batch [1920/2000] time 2.051 (2.202) data 0.000 (0.001) loss 0.2995 (1.1984) lr 6.3188e-04 eta 15:56:59
epoch [37/50] batch [1940/2000] time 2.077 (2.201) data 0.009 (0.001) loss 0.1909 (1.1951) lr 6.3188e-04 eta 15:55:50
epoch [37/50] batch [1960/2000] time 2.055 (2.199) data 0.000 (0.001) loss 0.2387 (1.1922) lr 6.3188e-04 eta 15:54:26
epoch [37/50] batch [1980/2000] time 2.065 (2.198) data 0.000 (0.001) loss 0.5145 (1.1911) lr 6.3188e-04 eta 15:53:04
epoch [37/50] batch [2000/2000] time 2.063 (2.196) data 0.000 (0.001) loss 0.4260 (1.1904) lr 5.7422e-04 eta 15:51:42
epoch [38/50] batch [20/2000] time 2.071 (2.093) data 0.000 (0.043) loss 2.5134 (1.2602) lr 5.7422e-04 eta 15:06:17
epoch [38/50] batch [40/2000] time 2.012 (2.073) data 0.000 (0.022) loss 0.3788 (1.2087) lr 5.7422e-04 eta 14:56:45
epoch [38/50] batch [60/2000] time 2.069 (2.067) data 0.004 (0.015) loss 0.5183 (1.1587) lr 5.7422e-04 eta 14:53:41
epoch [38/50] batch [80/2000] time 2.065 (2.068) data 0.001 (0.011) loss 0.2159 (1.1253) lr 5.7422e-04 eta 14:53:34
epoch [38/50] batch [100/2000] time 2.049 (2.067) data 0.000 (0.009) loss 0.2844 (1.0873) lr 5.7422e-04 eta 14:52:16
epoch [38/50] batch [120/2000] time 2.069 (2.063) data 0.000 (0.008) loss 0.7805 (1.0801) lr 5.7422e-04 eta 14:50:01
epoch [38/50] batch [140/2000] time 2.039 (2.062) data 0.000 (0.007) loss 2.8266 (1.1285) lr 5.7422e-04 eta 14:48:49
epoch [38/50] batch [160/2000] time 2.153 (2.064) data 0.007 (0.006) loss 0.6130 (1.0934) lr 5.7422e-04 eta 14:48:45
epoch [38/50] batch [180/2000] time 2.062 (2.064) data 0.000 (0.006) loss 0.7048 (1.1274) lr 5.7422e-04 eta 14:48:04
epoch [38/50] batch [200/2000] time 2.065 (2.065) data 0.000 (0.005) loss 0.6891 (1.1491) lr 5.7422e-04 eta 14:47:47
epoch [38/50] batch [220/2000] time 2.080 (2.064) data 0.000 (0.005) loss 2.4049 (1.1445) lr 5.7422e-04 eta 14:46:44
epoch [38/50] batch [240/2000] time 2.047 (2.062) data 0.000 (0.004) loss 0.7019 (1.1373) lr 5.7422e-04 eta 14:45:24
epoch [38/50] batch [260/2000] time 2.040 (2.061) data 0.000 (0.004) loss 3.8165 (1.1597) lr 5.7422e-04 eta 14:44:11
epoch [38/50] batch [280/2000] time 2.039 (2.060) data 0.000 (0.004) loss 1.4474 (1.1629) lr 5.7422e-04 eta 14:43:05
epoch [38/50] batch [300/2000] time 2.045 (2.060) data 0.000 (0.004) loss 0.5187 (1.1719) lr 5.7422e-04 eta 14:42:09
epoch [38/50] batch [320/2000] time 2.068 (2.059) data 0.000 (0.004) loss 1.0984 (1.1865) lr 5.7422e-04 eta 14:41:26
epoch [38/50] batch [340/2000] time 2.038 (2.059) data 0.000 (0.003) loss 2.0260 (1.1961) lr 5.7422e-04 eta 14:40:27
epoch [38/50] batch [360/2000] time 2.040 (2.059) data 0.000 (0.003) loss 0.0991 (1.2004) lr 5.7422e-04 eta 14:39:45
epoch [38/50] batch [380/2000] time 2.080 (2.058) data 0.000 (0.003) loss 1.8508 (1.2283) lr 5.7422e-04 eta 14:38:43
epoch [38/50] batch [400/2000] time 2.026 (2.058) data 0.001 (0.003) loss 1.1173 (1.2346) lr 5.7422e-04 eta 14:38:09
epoch [38/50] batch [420/2000] time 2.058 (2.058) data 0.000 (0.003) loss 1.1737 (1.2239) lr 5.7422e-04 eta 14:37:15
epoch [38/50] batch [440/2000] time 2.057 (2.057) data 0.000 (0.003) loss 3.0963 (1.2082) lr 5.7422e-04 eta 14:36:17
epoch [38/50] batch [460/2000] time 2.054 (2.057) data 0.000 (0.003) loss 0.7257 (1.2143) lr 5.7422e-04 eta 14:35:37
epoch [38/50] batch [480/2000] time 2.008 (2.057) data 0.000 (0.003) loss 2.3839 (1.2081) lr 5.7422e-04 eta 14:34:44
epoch [38/50] batch [500/2000] time 2.011 (2.056) data 0.000 (0.003) loss 0.3970 (1.1978) lr 5.7422e-04 eta 14:33:48
epoch [38/50] batch [520/2000] time 2.040 (2.056) data 0.000 (0.002) loss 0.2353 (1.1928) lr 5.7422e-04 eta 14:32:59
epoch [38/50] batch [540/2000] time 2.048 (2.055) data 0.000 (0.002) loss 0.7268 (1.1921) lr 5.7422e-04 eta 14:32:08
epoch [38/50] batch [560/2000] time 1.988 (2.055) data 0.000 (0.002) loss 0.2416 (1.1805) lr 5.7422e-04 eta 14:31:17
epoch [38/50] batch [580/2000] time 2.022 (2.055) data 0.000 (0.002) loss 2.5475 (1.1836) lr 5.7422e-04 eta 14:30:31
epoch [38/50] batch [600/2000] time 2.068 (2.054) data 0.001 (0.002) loss 0.0940 (1.1825) lr 5.7422e-04 eta 14:29:32
epoch [38/50] batch [620/2000] time 2.078 (2.054) data 0.000 (0.002) loss 0.4511 (1.1802) lr 5.7422e-04 eta 14:28:50
epoch [38/50] batch [640/2000] time 2.062 (2.054) data 0.000 (0.002) loss 0.5323 (1.1854) lr 5.7422e-04 eta 14:28:08
epoch [38/50] batch [660/2000] time 2.013 (2.054) data 0.000 (0.002) loss 0.9364 (1.1805) lr 5.7422e-04 eta 14:27:27
epoch [38/50] batch [680/2000] time 2.066 (2.054) data 0.000 (0.002) loss 2.7378 (1.1827) lr 5.7422e-04 eta 14:26:40
epoch [38/50] batch [700/2000] time 2.008 (2.053) data 0.000 (0.002) loss 1.8621 (1.1847) lr 5.7422e-04 eta 14:25:41
epoch [38/50] batch [720/2000] time 2.130 (2.053) data 0.000 (0.002) loss 1.9285 (1.1852) lr 5.7422e-04 eta 14:25:05
epoch [38/50] batch [740/2000] time 2.062 (2.053) data 0.000 (0.002) loss 0.8962 (1.1820) lr 5.7422e-04 eta 14:24:15
epoch [38/50] batch [760/2000] time 2.065 (2.053) data 0.000 (0.002) loss 0.1459 (1.1807) lr 5.7422e-04 eta 14:23:26
epoch [38/50] batch [780/2000] time 2.008 (2.052) data 0.000 (0.002) loss 0.3960 (1.1715) lr 5.7422e-04 eta 14:22:40
epoch [38/50] batch [800/2000] time 2.005 (2.052) data 0.000 (0.002) loss 0.4910 (1.1816) lr 5.7422e-04 eta 14:21:59
epoch [38/50] batch [820/2000] time 2.059 (2.052) data 0.000 (0.002) loss 0.6881 (1.1785) lr 5.7422e-04 eta 14:21:03
epoch [38/50] batch [840/2000] time 2.059 (2.052) data 0.000 (0.002) loss 0.8119 (1.1757) lr 5.7422e-04 eta 14:20:17
epoch [38/50] batch [860/2000] time 2.058 (2.052) data 0.000 (0.002) loss 2.2310 (1.1807) lr 5.7422e-04 eta 14:19:35
epoch [38/50] batch [880/2000] time 2.005 (2.052) data 0.000 (0.002) loss 1.1143 (1.1788) lr 5.7422e-04 eta 14:19:14
epoch [38/50] batch [900/2000] time 2.056 (2.052) data 0.000 (0.002) loss 0.2985 (1.1797) lr 5.7422e-04 eta 14:18:25
epoch [38/50] batch [920/2000] time 2.069 (2.052) data 0.000 (0.002) loss 1.1941 (1.1857) lr 5.7422e-04 eta 14:17:38
epoch [38/50] batch [940/2000] time 2.063 (2.051) data 0.000 (0.002) loss 2.9205 (1.1894) lr 5.7422e-04 eta 14:16:49
epoch [38/50] batch [960/2000] time 2.071 (2.052) data 0.000 (0.002) loss 2.0988 (1.1900) lr 5.7422e-04 eta 14:16:17
epoch [38/50] batch [980/2000] time 2.068 (2.052) data 0.000 (0.002) loss 1.2390 (1.1875) lr 5.7422e-04 eta 14:15:32
epoch [38/50] batch [1000/2000] time 2.005 (2.052) data 0.000 (0.001) loss 2.2144 (1.1840) lr 5.7422e-04 eta 14:14:53
epoch [38/50] batch [1020/2000] time 1.985 (2.052) data 0.000 (0.001) loss 0.2313 (1.1831) lr 5.7422e-04 eta 14:14:11
epoch [38/50] batch [1040/2000] time 2.045 (2.052) data 0.000 (0.001) loss 1.0240 (1.1833) lr 5.7422e-04 eta 14:13:41
epoch [38/50] batch [1060/2000] time 2.021 (2.052) data 0.000 (0.001) loss 3.8491 (1.1794) lr 5.7422e-04 eta 14:12:58
epoch [38/50] batch [1080/2000] time 2.042 (2.052) data 0.002 (0.001) loss 0.9315 (1.1828) lr 5.7422e-04 eta 14:12:13
epoch [38/50] batch [1100/2000] time 2.066 (2.052) data 0.000 (0.001) loss 0.1663 (1.1778) lr 5.7422e-04 eta 14:11:34
epoch [38/50] batch [1120/2000] time 2.104 (2.052) data 0.001 (0.001) loss 0.3064 (1.1788) lr 5.7422e-04 eta 14:11:03
epoch [38/50] batch [1140/2000] time 2.060 (2.053) data 0.001 (0.001) loss 0.8175 (1.1717) lr 5.7422e-04 eta 14:10:39
epoch [38/50] batch [1160/2000] time 2.041 (2.053) data 0.000 (0.001) loss 0.9135 (1.1710) lr 5.7422e-04 eta 14:09:54
epoch [38/50] batch [1180/2000] time 2.011 (2.053) data 0.000 (0.001) loss 1.1020 (1.1693) lr 5.7422e-04 eta 14:09:08
epoch [38/50] batch [1200/2000] time 2.066 (2.053) data 0.000 (0.001) loss 1.2710 (1.1710) lr 5.7422e-04 eta 14:08:26
epoch [38/50] batch [1220/2000] time 2.101 (2.053) data 0.000 (0.001) loss 0.1295 (1.1688) lr 5.7422e-04 eta 14:07:50
epoch [38/50] batch [1240/2000] time 2.017 (2.053) data 0.000 (0.001) loss 1.8390 (1.1744) lr 5.7422e-04 eta 14:07:07
epoch [38/50] batch [1260/2000] time 2.074 (2.053) data 0.000 (0.001) loss 0.3779 (1.1741) lr 5.7422e-04 eta 14:06:22
epoch [38/50] batch [1280/2000] time 2.070 (2.053) data 0.000 (0.001) loss 1.3747 (1.1735) lr 5.7422e-04 eta 14:05:40
epoch [38/50] batch [1300/2000] time 2.026 (2.052) data 0.003 (0.001) loss 1.1604 (1.1732) lr 5.7422e-04 eta 14:04:55
epoch [38/50] batch [1320/2000] time 2.011 (2.053) data 0.000 (0.001) loss 1.2325 (1.1739) lr 5.7422e-04 eta 14:04:18
epoch [38/50] batch [1340/2000] time 2.061 (2.053) data 0.000 (0.001) loss 0.4158 (1.1699) lr 5.7422e-04 eta 14:03:35
epoch [38/50] batch [1360/2000] time 2.017 (2.053) data 0.000 (0.001) loss 0.2390 (1.1738) lr 5.7422e-04 eta 14:02:57
epoch [38/50] batch [1380/2000] time 2.114 (2.053) data 0.006 (0.001) loss 0.8834 (1.1712) lr 5.7422e-04 eta 14:02:20
epoch [38/50] batch [1400/2000] time 2.015 (2.053) data 0.000 (0.001) loss 1.8078 (1.1717) lr 5.7422e-04 eta 14:01:49
epoch [38/50] batch [1420/2000] time 1.982 (2.053) data 0.000 (0.001) loss 0.0226 (1.1701) lr 5.7422e-04 eta 14:01:04
epoch [38/50] batch [1440/2000] time 2.007 (2.053) data 0.000 (0.001) loss 0.3062 (1.1660) lr 5.7422e-04 eta 14:00:22
epoch [38/50] batch [1460/2000] time 2.046 (2.053) data 0.000 (0.001) loss 0.6718 (1.1638) lr 5.7422e-04 eta 13:59:39
epoch [38/50] batch [1480/2000] time 2.085 (2.053) data 0.000 (0.001) loss 2.7542 (1.1678) lr 5.7422e-04 eta 13:58:57
epoch [38/50] batch [1500/2000] time 2.012 (2.053) data 0.000 (0.001) loss 0.6149 (1.1657) lr 5.7422e-04 eta 13:58:14
epoch [38/50] batch [1520/2000] time 2.057 (2.053) data 0.000 (0.001) loss 0.1786 (1.1619) lr 5.7422e-04 eta 13:57:37
epoch [38/50] batch [1540/2000] time 2.075 (2.053) data 0.000 (0.001) loss 0.2450 (1.1605) lr 5.7422e-04 eta 13:56:55
epoch [38/50] batch [1560/2000] time 1.987 (2.053) data 0.000 (0.001) loss 1.3429 (1.1616) lr 5.7422e-04 eta 13:56:12
epoch [38/50] batch [1580/2000] time 1.999 (2.053) data 0.000 (0.001) loss 0.3758 (1.1596) lr 5.7422e-04 eta 13:55:30
epoch [38/50] batch [1600/2000] time 2.151 (2.053) data 0.000 (0.001) loss 0.8278 (1.1571) lr 5.7422e-04 eta 13:55:03
epoch [38/50] batch [1620/2000] time 2.037 (2.054) data 0.000 (0.001) loss 0.5045 (1.1550) lr 5.7422e-04 eta 13:54:27
epoch [38/50] batch [1640/2000] time 2.054 (2.053) data 0.000 (0.001) loss 1.0075 (1.1517) lr 5.7422e-04 eta 13:53:41
epoch [38/50] batch [1660/2000] time 2.065 (2.053) data 0.000 (0.001) loss 0.3501 (1.1526) lr 5.7422e-04 eta 13:52:57
epoch [38/50] batch [1680/2000] time 2.094 (2.053) data 0.001 (0.001) loss 1.7022 (1.1581) lr 5.7422e-04 eta 13:52:17
epoch [38/50] batch [1700/2000] time 2.021 (2.053) data 0.000 (0.001) loss 1.3328 (1.1597) lr 5.7422e-04 eta 13:51:37
epoch [38/50] batch [1720/2000] time 2.026 (2.053) data 0.000 (0.001) loss 0.0654 (1.1579) lr 5.7422e-04 eta 13:50:58
epoch [38/50] batch [1740/2000] time 2.049 (2.054) data 0.000 (0.001) loss 0.1400 (1.1609) lr 5.7422e-04 eta 13:50:18
epoch [38/50] batch [1760/2000] time 2.078 (2.054) data 0.000 (0.001) loss 1.6410 (1.1591) lr 5.7422e-04 eta 13:49:38
epoch [38/50] batch [1780/2000] time 2.009 (2.054) data 0.000 (0.001) loss 1.8746 (1.1578) lr 5.7422e-04 eta 13:48:57
epoch [38/50] batch [1800/2000] time 2.062 (2.054) data 0.000 (0.001) loss 3.3999 (1.1583) lr 5.7422e-04 eta 13:48:19
epoch [38/50] batch [1820/2000] time 2.069 (2.054) data 0.000 (0.001) loss 2.7672 (1.1572) lr 5.7422e-04 eta 13:47:46
epoch [38/50] batch [1840/2000] time 2.041 (2.054) data 0.000 (0.001) loss 0.0782 (1.1597) lr 5.7422e-04 eta 13:47:00
epoch [38/50] batch [1860/2000] time 2.044 (2.054) data 0.000 (0.001) loss 0.2527 (1.1580) lr 5.7422e-04 eta 13:46:22
epoch [38/50] batch [1880/2000] time 1.981 (2.054) data 0.000 (0.001) loss 0.5699 (1.1560) lr 5.7422e-04 eta 13:45:39
epoch [38/50] batch [1900/2000] time 2.018 (2.054) data 0.000 (0.001) loss 0.9545 (1.1536) lr 5.7422e-04 eta 13:44:59
epoch [38/50] batch [1920/2000] time 2.073 (2.054) data 0.000 (0.001) loss 0.4398 (1.1538) lr 5.7422e-04 eta 13:44:18
epoch [38/50] batch [1940/2000] time 2.122 (2.054) data 0.000 (0.001) loss 0.9284 (1.1558) lr 5.7422e-04 eta 13:43:39
epoch [38/50] batch [1960/2000] time 2.011 (2.054) data 0.000 (0.001) loss 2.3632 (1.1580) lr 5.7422e-04 eta 13:42:59
epoch [38/50] batch [1980/2000] time 2.014 (2.054) data 0.000 (0.001) loss 1.9625 (1.1626) lr 5.7422e-04 eta 13:42:22
epoch [38/50] batch [2000/2000] time 2.257 (2.054) data 0.000 (0.001) loss 2.2209 (1.1621) lr 5.1825e-04 eta 13:41:47
epoch [39/50] batch [20/2000] time 2.044 (2.125) data 0.000 (0.049) loss 1.3097 (0.9296) lr 5.1825e-04 eta 14:09:20
epoch [39/50] batch [40/2000] time 2.066 (2.093) data 0.000 (0.024) loss 0.4595 (1.0320) lr 5.1825e-04 eta 13:55:48
epoch [39/50] batch [60/2000] time 2.039 (2.080) data 0.001 (0.016) loss 0.2669 (1.0853) lr 5.1825e-04 eta 13:49:54
epoch [39/50] batch [80/2000] time 2.048 (2.072) data 0.000 (0.012) loss 3.1875 (1.2513) lr 5.1825e-04 eta 13:46:13
epoch [39/50] batch [100/2000] time 2.123 (2.070) data 0.000 (0.010) loss 0.2110 (1.2524) lr 5.1825e-04 eta 13:44:27
epoch [39/50] batch [120/2000] time 4.383 (2.431) data 0.001 (0.009) loss 0.5144 (1.2342) lr 5.1825e-04 eta 16:07:23
epoch [39/50] batch [140/2000] time 4.362 (2.697) data 0.000 (0.008) loss 1.0759 (1.2543) lr 5.1825e-04 eta 17:52:35
epoch [39/50] batch [160/2000] time 4.426 (2.896) data 0.000 (0.007) loss 1.7137 (1.2503) lr 5.1825e-04 eta 19:10:38
epoch [39/50] batch [180/2000] time 2.016 (2.856) data 0.000 (0.006) loss 1.0449 (1.2189) lr 5.1825e-04 eta 18:53:55
epoch [39/50] batch [200/2000] time 2.068 (2.776) data 0.000 (0.006) loss 1.4312 (1.2193) lr 5.1825e-04 eta 18:21:04
epoch [39/50] batch [220/2000] time 2.055 (2.710) data 0.001 (0.005) loss 0.1914 (1.1842) lr 5.1825e-04 eta 17:54:03
epoch [39/50] batch [240/2000] time 1.984 (2.655) data 0.000 (0.005) loss 1.4272 (1.1961) lr 5.1825e-04 eta 17:31:32
epoch [39/50] batch [260/2000] time 2.003 (2.611) data 0.004 (0.005) loss 0.4932 (1.1658) lr 5.1825e-04 eta 17:12:53
epoch [39/50] batch [280/2000] time 2.001 (2.571) data 0.000 (0.004) loss 0.6210 (1.1785) lr 5.1825e-04 eta 16:56:26
epoch [39/50] batch [300/2000] time 4.389 (2.664) data 0.001 (0.004) loss 2.1471 (1.1900) lr 5.1825e-04 eta 17:32:21
epoch [39/50] batch [320/2000] time 2.014 (2.693) data 0.000 (0.004) loss 1.0047 (1.1779) lr 5.1825e-04 eta 17:42:53
epoch [39/50] batch [340/2000] time 2.047 (2.656) data 0.000 (0.004) loss 0.0382 (1.1639) lr 5.1825e-04 eta 17:27:18
epoch [39/50] batch [360/2000] time 2.091 (2.622) data 0.000 (0.003) loss 2.0189 (1.1702) lr 5.1825e-04 eta 17:13:04
epoch [39/50] batch [380/2000] time 2.061 (2.592) data 0.000 (0.003) loss 0.3693 (1.1561) lr 5.1825e-04 eta 17:00:29
epoch [39/50] batch [400/2000] time 2.026 (2.566) data 0.000 (0.003) loss 0.2370 (1.1465) lr 5.1825e-04 eta 16:49:07
epoch [39/50] batch [420/2000] time 2.070 (2.541) data 0.000 (0.003) loss 3.1626 (1.1578) lr 5.1825e-04 eta 16:38:43
epoch [39/50] batch [440/2000] time 2.050 (2.519) data 0.000 (0.003) loss 0.6823 (1.1528) lr 5.1825e-04 eta 16:29:17
epoch [39/50] batch [460/2000] time 2.059 (2.499) data 0.000 (0.003) loss 3.1497 (1.1616) lr 5.1825e-04 eta 16:20:23
epoch [39/50] batch [480/2000] time 2.075 (2.481) data 0.000 (0.003) loss 0.1735 (1.1584) lr 5.1825e-04 eta 16:12:27
epoch [39/50] batch [500/2000] time 2.012 (2.464) data 0.000 (0.003) loss 0.3749 (1.1646) lr 5.1825e-04 eta 16:04:54
epoch [39/50] batch [520/2000] time 2.057 (2.448) data 0.000 (0.003) loss 1.7646 (1.1521) lr 5.1825e-04 eta 15:57:48
epoch [39/50] batch [540/2000] time 2.022 (2.433) data 0.000 (0.003) loss 1.9406 (1.1584) lr 5.1825e-04 eta 15:51:19
epoch [39/50] batch [560/2000] time 2.041 (2.420) data 0.000 (0.002) loss 0.2723 (1.1582) lr 5.1825e-04 eta 15:45:32
epoch [39/50] batch [580/2000] time 2.049 (2.407) data 0.002 (0.002) loss 1.1850 (1.1528) lr 5.1825e-04 eta 15:39:42
epoch [39/50] batch [600/2000] time 2.005 (2.395) data 0.001 (0.002) loss 0.9672 (1.1471) lr 5.1825e-04 eta 15:34:05
epoch [39/50] batch [620/2000] time 2.009 (2.384) data 0.000 (0.002) loss 0.0957 (1.1388) lr 5.1825e-04 eta 15:28:51
epoch [39/50] batch [640/2000] time 2.045 (2.373) data 0.000 (0.002) loss 1.5521 (1.1494) lr 5.1825e-04 eta 15:24:02
epoch [39/50] batch [660/2000] time 2.043 (2.364) data 0.000 (0.002) loss 1.5548 (1.1550) lr 5.1825e-04 eta 15:19:33
epoch [39/50] batch [680/2000] time 2.060 (2.354) data 0.000 (0.002) loss 0.3622 (1.1487) lr 5.1825e-04 eta 15:15:04
epoch [39/50] batch [700/2000] time 2.067 (2.346) data 0.000 (0.002) loss 0.4021 (1.1495) lr 5.1825e-04 eta 15:10:53
epoch [39/50] batch [720/2000] time 2.172 (2.338) data 0.000 (0.002) loss 0.0444 (1.1385) lr 5.1825e-04 eta 15:07:12
epoch [39/50] batch [740/2000] time 2.084 (2.330) data 0.000 (0.002) loss 0.5304 (1.1363) lr 5.1825e-04 eta 15:03:21
epoch [39/50] batch [760/2000] time 2.067 (2.323) data 0.000 (0.002) loss 0.2506 (1.1340) lr 5.1825e-04 eta 14:59:46
epoch [39/50] batch [780/2000] time 2.070 (2.316) data 0.000 (0.002) loss 1.9975 (1.1350) lr 5.1825e-04 eta 14:56:21
epoch [39/50] batch [800/2000] time 2.072 (2.310) data 0.000 (0.002) loss 1.0730 (1.1371) lr 5.1825e-04 eta 14:53:01
epoch [39/50] batch [820/2000] time 2.086 (2.303) data 0.000 (0.002) loss 1.1095 (1.1321) lr 5.1825e-04 eta 14:49:50
epoch [39/50] batch [840/2000] time 2.077 (2.297) data 0.000 (0.002) loss 0.5631 (1.1349) lr 5.1825e-04 eta 14:46:49
epoch [39/50] batch [860/2000] time 2.065 (2.292) data 0.000 (0.002) loss 0.2791 (1.1326) lr 5.1825e-04 eta 14:43:52
epoch [39/50] batch [880/2000] time 2.096 (2.287) data 0.000 (0.002) loss 1.3762 (1.1334) lr 5.1825e-04 eta 14:41:04
epoch [39/50] batch [900/2000] time 2.169 (2.282) data 0.000 (0.002) loss 0.7784 (1.1319) lr 5.1825e-04 eta 14:38:43
epoch [39/50] batch [920/2000] time 2.126 (2.278) data 0.002 (0.002) loss 2.8871 (1.1325) lr 5.1825e-04 eta 14:36:19
epoch [39/50] batch [940/2000] time 1.998 (2.274) data 0.004 (0.002) loss 2.9620 (1.1364) lr 5.1825e-04 eta 14:33:48
epoch [39/50] batch [960/2000] time 2.070 (2.269) data 0.000 (0.002) loss 0.6921 (1.1363) lr 5.1825e-04 eta 14:31:20
epoch [39/50] batch [980/2000] time 2.072 (2.265) data 0.000 (0.002) loss 0.5048 (1.1360) lr 5.1825e-04 eta 14:28:59
epoch [39/50] batch [1000/2000] time 2.062 (2.260) data 0.000 (0.002) loss 0.9149 (1.1381) lr 5.1825e-04 eta 14:26:31
epoch [39/50] batch [1020/2000] time 2.074 (2.256) data 0.000 (0.002) loss 3.0147 (1.1389) lr 5.1825e-04 eta 14:24:04
epoch [39/50] batch [1040/2000] time 2.071 (2.252) data 0.000 (0.002) loss 1.3395 (1.1401) lr 5.1825e-04 eta 14:21:45
epoch [39/50] batch [1060/2000] time 2.007 (2.248) data 0.000 (0.002) loss 0.7485 (1.1432) lr 5.1825e-04 eta 14:19:32
epoch [39/50] batch [1080/2000] time 2.050 (2.245) data 0.005 (0.002) loss 0.3982 (1.1563) lr 5.1825e-04 eta 14:17:24
epoch [39/50] batch [1100/2000] time 2.075 (2.241) data 0.000 (0.002) loss 1.4137 (1.1539) lr 5.1825e-04 eta 14:15:20
epoch [39/50] batch [1120/2000] time 2.051 (2.238) data 0.000 (0.002) loss 1.9527 (1.1448) lr 5.1825e-04 eta 14:13:18
epoch [39/50] batch [1140/2000] time 2.064 (2.235) data 0.001 (0.002) loss 1.3442 (1.1492) lr 5.1825e-04 eta 14:11:22
epoch [39/50] batch [1160/2000] time 2.002 (2.232) data 0.000 (0.002) loss 1.8218 (1.1464) lr 5.1825e-04 eta 14:09:32
epoch [39/50] batch [1180/2000] time 2.081 (2.229) data 0.000 (0.002) loss 0.2368 (1.1460) lr 5.1825e-04 eta 14:07:37
epoch [39/50] batch [1200/2000] time 2.052 (2.226) data 0.000 (0.002) loss 0.8494 (1.1439) lr 5.1825e-04 eta 14:05:48
epoch [39/50] batch [1220/2000] time 2.048 (2.223) data 0.000 (0.002) loss 0.0999 (1.1436) lr 5.1825e-04 eta 14:04:00
epoch [39/50] batch [1240/2000] time 2.096 (2.221) data 0.001 (0.002) loss 0.2995 (1.1523) lr 5.1825e-04 eta 14:02:26
epoch [39/50] batch [1260/2000] time 2.043 (2.218) data 0.000 (0.002) loss 2.3913 (1.1507) lr 5.1825e-04 eta 14:00:38
epoch [39/50] batch [1280/2000] time 2.030 (2.215) data 0.000 (0.002) loss 1.3672 (1.1552) lr 5.1825e-04 eta 13:58:55
epoch [39/50] batch [1300/2000] time 1.985 (2.213) data 0.000 (0.002) loss 1.4079 (1.1545) lr 5.1825e-04 eta 13:57:14
epoch [39/50] batch [1320/2000] time 2.090 (2.211) data 0.000 (0.002) loss 2.8220 (1.1608) lr 5.1825e-04 eta 13:55:35
epoch [39/50] batch [1340/2000] time 2.031 (2.208) data 0.000 (0.002) loss 2.3991 (1.1606) lr 5.1825e-04 eta 13:53:55
epoch [39/50] batch [1360/2000] time 2.012 (2.206) data 0.000 (0.002) loss 2.2274 (1.1602) lr 5.1825e-04 eta 13:52:21
epoch [39/50] batch [1380/2000] time 2.017 (2.204) data 0.001 (0.002) loss 2.0533 (1.1603) lr 5.1825e-04 eta 13:50:45
epoch [39/50] batch [1400/2000] time 2.046 (2.201) data 0.000 (0.001) loss 0.4419 (1.1633) lr 5.1825e-04 eta 13:49:10
epoch [39/50] batch [1420/2000] time 2.010 (2.199) data 0.000 (0.001) loss 1.1038 (1.1663) lr 5.1825e-04 eta 13:47:33
epoch [39/50] batch [1440/2000] time 2.065 (2.197) data 0.000 (0.001) loss 0.9375 (1.1660) lr 5.1825e-04 eta 13:46:01
epoch [39/50] batch [1460/2000] time 2.058 (2.195) data 0.000 (0.001) loss 0.5966 (1.1656) lr 5.1825e-04 eta 13:44:30
epoch [39/50] batch [1480/2000] time 2.001 (2.193) data 0.000 (0.001) loss 2.7257 (1.1635) lr 5.1825e-04 eta 13:42:59
epoch [39/50] batch [1500/2000] time 2.043 (2.191) data 0.000 (0.001) loss 0.3326 (1.1611) lr 5.1825e-04 eta 13:41:32
epoch [39/50] batch [1520/2000] time 2.078 (2.189) data 0.003 (0.001) loss 3.6224 (1.1671) lr 5.1825e-04 eta 13:40:02
epoch [39/50] batch [1540/2000] time 2.021 (2.187) data 0.000 (0.001) loss 0.2653 (1.1650) lr 5.1825e-04 eta 13:38:39
epoch [39/50] batch [1560/2000] time 2.016 (2.185) data 0.000 (0.001) loss 1.0098 (1.1621) lr 5.1825e-04 eta 13:37:14
epoch [39/50] batch [1580/2000] time 2.048 (2.183) data 0.000 (0.001) loss 0.5197 (1.1625) lr 5.1825e-04 eta 13:35:52
epoch [39/50] batch [1600/2000] time 2.128 (2.182) data 0.000 (0.001) loss 1.1299 (1.1617) lr 5.1825e-04 eta 13:34:29
epoch [39/50] batch [1620/2000] time 2.008 (2.180) data 0.000 (0.001) loss 4.4295 (1.1641) lr 5.1825e-04 eta 13:33:12
epoch [39/50] batch [1640/2000] time 2.092 (2.179) data 0.003 (0.001) loss 0.6837 (1.1628) lr 5.1825e-04 eta 13:31:53
epoch [39/50] batch [1660/2000] time 2.136 (2.178) data 0.001 (0.001) loss 0.1241 (1.1610) lr 5.1825e-04 eta 13:30:53
epoch [39/50] batch [1680/2000] time 2.088 (2.177) data 0.001 (0.001) loss 1.4003 (1.1543) lr 5.1825e-04 eta 13:29:39
epoch [39/50] batch [1700/2000] time 2.076 (2.175) data 0.000 (0.001) loss 3.2645 (1.1561) lr 5.1825e-04 eta 13:28:29
epoch [39/50] batch [1720/2000] time 2.046 (2.174) data 0.000 (0.001) loss 1.1192 (1.1552) lr 5.1825e-04 eta 13:27:12
epoch [39/50] batch [1740/2000] time 2.014 (2.172) data 0.005 (0.001) loss 1.9262 (1.1580) lr 5.1825e-04 eta 13:25:57
epoch [39/50] batch [1760/2000] time 2.023 (2.171) data 0.001 (0.001) loss 1.7338 (1.1544) lr 5.1825e-04 eta 13:24:42
epoch [39/50] batch [1780/2000] time 2.039 (2.170) data 0.000 (0.001) loss 1.8831 (1.1539) lr 5.1825e-04 eta 13:23:28
epoch [39/50] batch [1800/2000] time 2.017 (2.168) data 0.000 (0.001) loss 0.2428 (1.1518) lr 5.1825e-04 eta 13:22:13
epoch [39/50] batch [1820/2000] time 2.058 (2.167) data 0.000 (0.001) loss 1.8174 (1.1533) lr 5.1825e-04 eta 13:21:00
epoch [39/50] batch [1840/2000] time 2.075 (2.166) data 0.001 (0.001) loss 1.3619 (1.1587) lr 5.1825e-04 eta 13:19:50
epoch [39/50] batch [1860/2000] time 2.076 (2.164) data 0.000 (0.001) loss 0.4755 (1.1584) lr 5.1825e-04 eta 13:18:39
epoch [39/50] batch [1880/2000] time 2.096 (2.163) data 0.000 (0.001) loss 0.6103 (1.1601) lr 5.1825e-04 eta 13:17:29
epoch [39/50] batch [1900/2000] time 2.036 (2.162) data 0.000 (0.001) loss 0.4028 (1.1603) lr 5.1825e-04 eta 13:16:21
epoch [39/50] batch [1920/2000] time 2.062 (2.161) data 0.000 (0.001) loss 0.1079 (1.1623) lr 5.1825e-04 eta 13:15:10
epoch [39/50] batch [1940/2000] time 2.120 (2.160) data 0.000 (0.001) loss 1.0147 (1.1604) lr 5.1825e-04 eta 13:14:06
epoch [39/50] batch [1960/2000] time 2.046 (2.159) data 0.001 (0.001) loss 1.2162 (1.1621) lr 5.1825e-04 eta 13:13:01
epoch [39/50] batch [1980/2000] time 2.062 (2.158) data 0.000 (0.001) loss 1.8420 (1.1630) lr 5.1825e-04 eta 13:11:53
epoch [39/50] batch [2000/2000] time 2.071 (2.157) data 0.000 (0.001) loss 1.2306 (1.1639) lr 4.6417e-04 eta 13:10:48
epoch [40/50] batch [20/2000] time 2.097 (2.103) data 0.000 (0.038) loss 0.6320 (0.8292) lr 4.6417e-04 eta 12:50:27
epoch [40/50] batch [40/2000] time 2.006 (2.080) data 0.000 (0.019) loss 0.2715 (0.8500) lr 4.6417e-04 eta 12:41:25
epoch [40/50] batch [60/2000] time 2.082 (2.069) data 0.001 (0.013) loss 0.1629 (0.8388) lr 4.6417e-04 eta 12:36:23
epoch [40/50] batch [80/2000] time 2.058 (2.065) data 0.000 (0.010) loss 0.2233 (0.8914) lr 4.6417e-04 eta 12:34:29
epoch [40/50] batch [100/2000] time 2.086 (2.065) data 0.000 (0.008) loss 0.0214 (0.9396) lr 4.6417e-04 eta 12:33:53
epoch [40/50] batch [120/2000] time 2.055 (2.067) data 0.000 (0.007) loss 2.3019 (0.9845) lr 4.6417e-04 eta 12:33:37
epoch [40/50] batch [140/2000] time 2.069 (2.062) data 0.000 (0.006) loss 1.0368 (0.9885) lr 4.6417e-04 eta 12:31:22
epoch [40/50] batch [160/2000] time 2.060 (2.061) data 0.000 (0.005) loss 0.2757 (0.9992) lr 4.6417e-04 eta 12:30:06
epoch [40/50] batch [180/2000] time 2.270 (2.060) data 0.000 (0.005) loss 0.1428 (1.0137) lr 4.6417e-04 eta 12:29:11
epoch [40/50] batch [200/2000] time 2.094 (2.060) data 0.000 (0.004) loss 3.0346 (1.0358) lr 4.6417e-04 eta 12:28:20
epoch [40/50] batch [220/2000] time 2.067 (2.060) data 0.000 (0.004) loss 1.6877 (1.0324) lr 4.6417e-04 eta 12:27:41
epoch [40/50] batch [240/2000] time 2.059 (2.059) data 0.000 (0.004) loss 1.6199 (1.0250) lr 4.6417e-04 eta 12:26:38
epoch [40/50] batch [260/2000] time 2.081 (2.058) data 0.000 (0.003) loss 1.4881 (1.0243) lr 4.6417e-04 eta 12:25:43
epoch [40/50] batch [280/2000] time 2.042 (2.059) data 0.000 (0.003) loss 0.7060 (1.0300) lr 4.6417e-04 eta 12:25:10
epoch [40/50] batch [300/2000] time 2.084 (2.058) data 0.001 (0.003) loss 1.6408 (1.0289) lr 4.6417e-04 eta 12:24:15
epoch [40/50] batch [320/2000] time 2.192 (2.057) data 0.000 (0.003) loss 2.8921 (1.0738) lr 4.6417e-04 eta 12:23:17
epoch [40/50] batch [340/2000] time 2.076 (2.056) data 0.000 (0.003) loss 2.0807 (1.0650) lr 4.6417e-04 eta 12:22:18
epoch [40/50] batch [360/2000] time 2.061 (2.057) data 0.000 (0.003) loss 1.9639 (1.0800) lr 4.6417e-04 eta 12:21:55
epoch [40/50] batch [380/2000] time 2.086 (2.057) data 0.000 (0.003) loss 1.6097 (1.0979) lr 4.6417e-04 eta 12:21:18
epoch [40/50] batch [400/2000] time 1.987 (2.057) data 0.000 (0.002) loss 1.0823 (1.1143) lr 4.6417e-04 eta 12:20:28
epoch [40/50] batch [420/2000] time 2.072 (2.057) data 0.000 (0.002) loss 0.0396 (1.1052) lr 4.6417e-04 eta 12:19:52
epoch [40/50] batch [440/2000] time 2.068 (2.058) data 0.000 (0.002) loss 2.5073 (1.1147) lr 4.6417e-04 eta 12:19:20
epoch [40/50] batch [460/2000] time 2.011 (2.057) data 0.000 (0.002) loss 0.5234 (1.1180) lr 4.6417e-04 eta 12:18:35
epoch [40/50] batch [480/2000] time 2.064 (2.057) data 0.000 (0.002) loss 0.4935 (1.1117) lr 4.6417e-04 eta 12:17:46
epoch [40/50] batch [500/2000] time 2.031 (2.057) data 0.000 (0.002) loss 3.7032 (1.1167) lr 4.6417e-04 eta 12:17:05
epoch [40/50] batch [520/2000] time 2.081 (2.057) data 0.000 (0.002) loss 0.4401 (1.1047) lr 4.6417e-04 eta 12:16:28
epoch [40/50] batch [540/2000] time 2.039 (2.057) data 0.000 (0.002) loss 0.3394 (1.1007) lr 4.6417e-04 eta 12:15:48
epoch [40/50] batch [560/2000] time 2.060 (2.057) data 0.000 (0.002) loss 0.9145 (1.1025) lr 4.6417e-04 eta 12:15:00
epoch [40/50] batch [580/2000] time 2.006 (2.056) data 0.000 (0.002) loss 0.4894 (1.1042) lr 4.6417e-04 eta 12:14:07
epoch [40/50] batch [600/2000] time 2.067 (2.056) data 0.001 (0.002) loss 2.8930 (1.1159) lr 4.6417e-04 eta 12:13:14
epoch [40/50] batch [620/2000] time 2.063 (2.055) data 0.000 (0.002) loss 0.4971 (1.1190) lr 4.6417e-04 eta 12:12:19
epoch [40/50] batch [640/2000] time 2.064 (2.055) data 0.000 (0.002) loss 0.7334 (1.1160) lr 4.6417e-04 eta 12:11:38
epoch [40/50] batch [660/2000] time 2.173 (2.055) data 0.000 (0.002) loss 0.0237 (1.1279) lr 4.6417e-04 eta 12:10:50
epoch [40/50] batch [680/2000] time 2.040 (2.054) data 0.000 (0.002) loss 0.1639 (1.1219) lr 4.6417e-04 eta 12:10:00
epoch [40/50] batch [700/2000] time 2.069 (2.054) data 0.000 (0.002) loss 0.5221 (1.1164) lr 4.6417e-04 eta 12:09:16
epoch [40/50] batch [720/2000] time 2.040 (2.054) data 0.000 (0.002) loss 0.3765 (1.1162) lr 4.6417e-04 eta 12:08:27
epoch [40/50] batch [740/2000] time 2.060 (2.054) data 0.000 (0.002) loss 0.1899 (1.1133) lr 4.6417e-04 eta 12:07:42
epoch [40/50] batch [760/2000] time 2.064 (2.053) data 0.000 (0.002) loss 1.0922 (1.1090) lr 4.6417e-04 eta 12:06:53
epoch [40/50] batch [780/2000] time 2.034 (2.053) data 0.000 (0.002) loss 1.8121 (1.1062) lr 4.6417e-04 eta 12:06:07
epoch [40/50] batch [800/2000] time 2.065 (2.053) data 0.000 (0.001) loss 0.2514 (1.1024) lr 4.6417e-04 eta 12:05:23
epoch [40/50] batch [820/2000] time 2.065 (2.053) data 0.000 (0.001) loss 1.4041 (1.1039) lr 4.6417e-04 eta 12:04:35
epoch [40/50] batch [840/2000] time 2.059 (2.052) data 0.000 (0.001) loss 0.9537 (1.1122) lr 4.6417e-04 eta 12:03:46
epoch [40/50] batch [860/2000] time 2.017 (2.052) data 0.001 (0.001) loss 0.9044 (1.1132) lr 4.6417e-04 eta 12:03:01
epoch [40/50] batch [880/2000] time 2.049 (2.052) data 0.000 (0.001) loss 1.8760 (1.1135) lr 4.6417e-04 eta 12:02:13
epoch [40/50] batch [900/2000] time 2.037 (2.051) data 0.000 (0.001) loss 1.6976 (1.1208) lr 4.6417e-04 eta 12:01:25
epoch [40/50] batch [920/2000] time 2.043 (2.051) data 0.001 (0.001) loss 2.0576 (1.1215) lr 4.6417e-04 eta 12:00:37
epoch [40/50] batch [940/2000] time 2.040 (2.051) data 0.000 (0.001) loss 0.7772 (1.1236) lr 4.6417e-04 eta 11:59:46
epoch [40/50] batch [960/2000] time 2.034 (2.050) data 0.000 (0.001) loss 0.2825 (1.1273) lr 4.6417e-04 eta 11:58:57
epoch [40/50] batch [980/2000] time 2.064 (2.050) data 0.000 (0.001) loss 1.2225 (1.1240) lr 4.6417e-04 eta 11:58:11
epoch [40/50] batch [1000/2000] time 2.009 (2.050) data 0.000 (0.001) loss 0.2768 (1.1224) lr 4.6417e-04 eta 11:57:26
epoch [40/50] batch [1020/2000] time 2.068 (2.050) data 0.000 (0.001) loss 1.1773 (1.1187) lr 4.6417e-04 eta 11:56:42
epoch [40/50] batch [1040/2000] time 2.007 (2.050) data 0.000 (0.001) loss 1.5151 (1.1259) lr 4.6417e-04 eta 11:56:01
epoch [40/50] batch [1060/2000] time 2.059 (2.050) data 0.000 (0.001) loss 0.8187 (1.1275) lr 4.6417e-04 eta 11:55:18
epoch [40/50] batch [1080/2000] time 2.007 (2.049) data 0.000 (0.001) loss 0.3050 (1.1344) lr 4.6417e-04 eta 11:54:31
epoch [40/50] batch [1100/2000] time 2.010 (2.049) data 0.000 (0.001) loss 1.9551 (1.1369) lr 4.6417e-04 eta 11:53:50
epoch [40/50] batch [1120/2000] time 2.041 (2.049) data 0.000 (0.001) loss 1.3687 (1.1319) lr 4.6417e-04 eta 11:53:08
epoch [40/50] batch [1140/2000] time 2.009 (2.049) data 0.001 (0.001) loss 0.1012 (1.1389) lr 4.6417e-04 eta 11:52:25
epoch [40/50] batch [1160/2000] time 2.063 (2.049) data 0.000 (0.001) loss 1.1193 (1.1445) lr 4.6417e-04 eta 11:51:43
epoch [40/50] batch [1180/2000] time 2.075 (2.049) data 0.000 (0.001) loss 1.1026 (1.1402) lr 4.6417e-04 eta 11:51:01
epoch [40/50] batch [1200/2000] time 2.041 (2.049) data 0.000 (0.001) loss 0.0668 (1.1425) lr 4.6417e-04 eta 11:50:16
epoch [40/50] batch [1220/2000] time 2.005 (2.049) data 0.000 (0.001) loss 2.5592 (1.1448) lr 4.6417e-04 eta 11:49:28
epoch [40/50] batch [1240/2000] time 2.032 (2.048) data 0.000 (0.001) loss 0.0636 (1.1437) lr 4.6417e-04 eta 11:48:44
epoch [40/50] batch [1260/2000] time 2.053 (2.048) data 0.000 (0.001) loss 1.0839 (1.1430) lr 4.6417e-04 eta 11:47:58
epoch [40/50] batch [1280/2000] time 2.058 (2.048) data 0.000 (0.001) loss 2.0588 (1.1436) lr 4.6417e-04 eta 11:47:11
epoch [40/50] batch [1300/2000] time 2.001 (2.048) data 0.000 (0.001) loss 0.6949 (1.1413) lr 4.6417e-04 eta 11:46:27
epoch [40/50] batch [1320/2000] time 2.007 (2.047) data 0.000 (0.001) loss 0.3498 (1.1375) lr 4.6417e-04 eta 11:45:40
epoch [40/50] batch [1340/2000] time 1.978 (2.047) data 0.000 (0.001) loss 1.2680 (1.1322) lr 4.6417e-04 eta 11:44:59
epoch [40/50] batch [1360/2000] time 2.032 (2.047) data 0.000 (0.001) loss 0.2275 (1.1337) lr 4.6417e-04 eta 11:44:13
epoch [40/50] batch [1380/2000] time 2.057 (2.047) data 0.000 (0.001) loss 0.4922 (1.1292) lr 4.6417e-04 eta 11:43:29
epoch [40/50] batch [1400/2000] time 2.004 (2.047) data 0.000 (0.001) loss 0.9750 (1.1289) lr 4.6417e-04 eta 11:42:44
epoch [40/50] batch [1420/2000] time 2.057 (2.047) data 0.000 (0.001) loss 2.3969 (1.1307) lr 4.6417e-04 eta 11:42:01
epoch [40/50] batch [1440/2000] time 2.034 (2.047) data 0.000 (0.001) loss 1.3946 (1.1338) lr 4.6417e-04 eta 11:41:17
epoch [40/50] batch [1460/2000] time 2.032 (2.046) data 0.000 (0.001) loss 1.8725 (1.1343) lr 4.6417e-04 eta 11:40:32
epoch [40/50] batch [1480/2000] time 2.083 (2.046) data 0.000 (0.001) loss 0.4836 (1.1347) lr 4.6417e-04 eta 11:39:50
epoch [40/50] batch [1500/2000] time 2.002 (2.046) data 0.000 (0.001) loss 0.1641 (1.1311) lr 4.6417e-04 eta 11:39:05
epoch [40/50] batch [1520/2000] time 2.057 (2.046) data 0.000 (0.001) loss 1.5144 (1.1318) lr 4.6417e-04 eta 11:38:20
epoch [40/50] batch [1540/2000] time 2.002 (2.046) data 0.000 (0.001) loss 0.7508 (1.1285) lr 4.6417e-04 eta 11:37:36
epoch [40/50] batch [1560/2000] time 2.004 (2.046) data 0.000 (0.001) loss 0.6485 (1.1310) lr 4.6417e-04 eta 11:36:51
epoch [40/50] batch [1580/2000] time 2.057 (2.045) data 0.000 (0.001) loss 2.6863 (1.1323) lr 4.6417e-04 eta 11:36:08
epoch [40/50] batch [1600/2000] time 2.033 (2.045) data 0.000 (0.001) loss 3.2101 (1.1314) lr 4.6417e-04 eta 11:35:25
epoch [40/50] batch [1620/2000] time 2.002 (2.045) data 0.000 (0.001) loss 1.2014 (1.1352) lr 4.6417e-04 eta 11:34:40
epoch [40/50] batch [1640/2000] time 2.000 (2.045) data 0.000 (0.001) loss 3.7604 (1.1365) lr 4.6417e-04 eta 11:33:58
epoch [40/50] batch [1660/2000] time 2.004 (2.045) data 0.000 (0.001) loss 2.3359 (1.1396) lr 4.6417e-04 eta 11:33:12
epoch [40/50] batch [1680/2000] time 2.054 (2.045) data 0.001 (0.001) loss 0.6307 (1.1397) lr 4.6417e-04 eta 11:32:28
epoch [40/50] batch [1700/2000] time 2.061 (2.045) data 0.000 (0.001) loss 1.5899 (1.1396) lr 4.6417e-04 eta 11:31:44
epoch [40/50] batch [1720/2000] time 2.037 (2.044) data 0.000 (0.001) loss 1.0152 (1.1353) lr 4.6417e-04 eta 11:31:02
epoch [40/50] batch [1740/2000] time 2.056 (2.044) data 0.000 (0.001) loss 0.5911 (1.1344) lr 4.6417e-04 eta 11:30:19
epoch [40/50] batch [1760/2000] time 2.007 (2.044) data 0.000 (0.001) loss 0.5915 (1.1356) lr 4.6417e-04 eta 11:29:34
epoch [40/50] batch [1780/2000] time 2.068 (2.044) data 0.000 (0.001) loss 0.2034 (1.1372) lr 4.6417e-04 eta 11:28:54
epoch [40/50] batch [1800/2000] time 2.007 (2.044) data 0.000 (0.001) loss 2.9613 (1.1362) lr 4.6417e-04 eta 11:28:11
epoch [40/50] batch [1820/2000] time 2.063 (2.044) data 0.000 (0.001) loss 0.0884 (1.1364) lr 4.6417e-04 eta 11:27:29
epoch [40/50] batch [1840/2000] time 2.934 (2.046) data 0.000 (0.001) loss 1.6901 (1.1398) lr 4.6417e-04 eta 11:27:22
epoch [40/50] batch [1860/2000] time 2.041 (2.048) data 0.000 (0.001) loss 1.4403 (1.1409) lr 4.6417e-04 eta 11:27:17
epoch [40/50] batch [1880/2000] time 2.060 (2.049) data 0.000 (0.001) loss 0.1697 (1.1422) lr 4.6417e-04 eta 11:27:05
epoch [40/50] batch [1900/2000] time 2.122 (2.052) data 0.000 (0.001) loss 0.7509 (1.1431) lr 4.6417e-04 eta 11:27:26
epoch [40/50] batch [1920/2000] time 2.084 (2.055) data 0.000 (0.001) loss 2.0581 (1.1441) lr 4.6417e-04 eta 11:27:38
epoch [40/50] batch [1940/2000] time 2.066 (2.057) data 0.000 (0.001) loss 0.0286 (1.1445) lr 4.6417e-04 eta 11:27:34
epoch [40/50] batch [1960/2000] time 2.202 (2.061) data 0.000 (0.001) loss 0.1598 (1.1440) lr 4.6417e-04 eta 11:28:27
epoch [40/50] batch [1980/2000] time 2.014 (2.069) data 0.005 (0.001) loss 1.1193 (1.1402) lr 4.6417e-04 eta 11:30:25
epoch [40/50] batch [2000/2000] time 4.361 (2.072) data 0.000 (0.001) loss 4.2081 (1.1401) lr 4.1221e-04 eta 11:30:46
epoch [41/50] batch [20/2000] time 4.299 (2.300) data 0.001 (0.035) loss 0.7810 (1.6348) lr 4.1221e-04 eta 12:45:52
epoch [41/50] batch [40/2000] time 2.357 (2.403) data 0.000 (0.018) loss 1.4158 (1.6898) lr 4.1221e-04 eta 13:19:27
epoch [41/50] batch [60/2000] time 2.050 (2.524) data 0.001 (0.012) loss 1.7648 (1.5281) lr 4.1221e-04 eta 13:58:54
epoch [41/50] batch [80/2000] time 2.066 (2.440) data 0.000 (0.009) loss 0.2625 (1.3634) lr 4.1221e-04 eta 13:30:05
epoch [41/50] batch [100/2000] time 2.065 (2.401) data 0.000 (0.008) loss 1.1420 (1.3367) lr 4.1221e-04 eta 13:16:16
epoch [41/50] batch [120/2000] time 2.036 (2.383) data 0.000 (0.006) loss 1.5175 (1.3158) lr 4.1221e-04 eta 13:09:35
epoch [41/50] batch [140/2000] time 1.980 (2.375) data 0.000 (0.006) loss 1.1024 (1.3051) lr 4.1221e-04 eta 13:06:06
epoch [41/50] batch [160/2000] time 2.121 (2.371) data 0.000 (0.005) loss 0.6496 (1.2532) lr 4.1221e-04 eta 13:04:00
epoch [41/50] batch [180/2000] time 2.059 (2.370) data 0.000 (0.005) loss 1.8460 (1.2605) lr 4.1221e-04 eta 13:02:59
epoch [41/50] batch [200/2000] time 2.006 (2.367) data 0.000 (0.004) loss 0.2854 (1.2027) lr 4.1221e-04 eta 13:01:14
epoch [41/50] batch [220/2000] time 2.007 (2.354) data 0.000 (0.004) loss 1.9438 (1.2063) lr 4.1221e-04 eta 12:56:11
epoch [41/50] batch [240/2000] time 2.062 (2.337) data 0.000 (0.004) loss 2.5724 (1.2096) lr 4.1221e-04 eta 12:49:30
epoch [41/50] batch [260/2000] time 2.063 (2.314) data 0.000 (0.003) loss 0.7618 (1.2003) lr 4.1221e-04 eta 12:41:26
epoch [41/50] batch [280/2000] time 2.063 (2.295) data 0.000 (0.003) loss 0.2367 (1.2005) lr 4.1221e-04 eta 12:34:21
epoch [41/50] batch [300/2000] time 2.063 (2.278) data 0.000 (0.003) loss 0.6182 (1.2057) lr 4.1221e-04 eta 12:28:04
epoch [41/50] batch [320/2000] time 2.036 (2.264) data 0.000 (0.003) loss 0.1325 (1.2162) lr 4.1221e-04 eta 12:22:32
epoch [41/50] batch [340/2000] time 2.003 (2.250) data 0.000 (0.003) loss 1.6676 (1.2304) lr 4.1221e-04 eta 12:17:23
epoch [41/50] batch [360/2000] time 1.980 (2.238) data 0.000 (0.003) loss 0.6822 (1.2458) lr 4.1221e-04 eta 12:12:41
epoch [41/50] batch [380/2000] time 2.000 (2.228) data 0.000 (0.002) loss 1.4864 (1.2375) lr 4.1221e-04 eta 12:08:28
epoch [41/50] batch [400/2000] time 2.005 (2.218) data 0.000 (0.002) loss 0.9267 (1.2432) lr 4.1221e-04 eta 12:04:32
epoch [41/50] batch [420/2000] time 2.061 (2.210) data 0.000 (0.002) loss 1.5417 (1.2278) lr 4.1221e-04 eta 12:01:04
epoch [41/50] batch [440/2000] time 2.037 (2.202) data 0.000 (0.002) loss 2.3245 (1.2180) lr 4.1221e-04 eta 11:57:41
epoch [41/50] batch [460/2000] time 2.076 (2.194) data 0.000 (0.002) loss 1.9929 (1.2108) lr 4.1221e-04 eta 11:54:39
epoch [41/50] batch [480/2000] time 2.057 (2.188) data 0.000 (0.002) loss 0.2407 (1.2015) lr 4.1221e-04 eta 11:51:55
epoch [41/50] batch [500/2000] time 2.064 (2.182) data 0.000 (0.002) loss 0.1751 (1.1971) lr 4.1221e-04 eta 11:49:15
epoch [41/50] batch [520/2000] time 1.986 (2.177) data 0.000 (0.002) loss 1.8996 (1.2031) lr 4.1221e-04 eta 11:46:41
epoch [41/50] batch [540/2000] time 2.065 (2.172) data 0.000 (0.002) loss 0.7297 (1.1968) lr 4.1221e-04 eta 11:44:22
epoch [41/50] batch [560/2000] time 2.008 (2.167) data 0.000 (0.002) loss 1.7872 (1.2015) lr 4.1221e-04 eta 11:42:12
epoch [41/50] batch [580/2000] time 2.040 (2.163) data 0.000 (0.002) loss 0.7618 (1.1948) lr 4.1221e-04 eta 11:40:03
epoch [41/50] batch [600/2000] time 2.008 (2.159) data 0.001 (0.002) loss 0.3959 (1.1818) lr 4.1221e-04 eta 11:37:59
epoch [41/50] batch [620/2000] time 2.059 (2.155) data 0.000 (0.002) loss 0.8020 (1.1803) lr 4.1221e-04 eta 11:36:09
epoch [41/50] batch [640/2000] time 2.062 (2.152) data 0.000 (0.002) loss 2.1634 (1.1824) lr 4.1221e-04 eta 11:34:19
epoch [41/50] batch [660/2000] time 2.064 (2.148) data 0.000 (0.002) loss 0.1513 (1.1797) lr 4.1221e-04 eta 11:32:31
epoch [41/50] batch [680/2000] time 2.043 (2.145) data 0.000 (0.001) loss 1.9181 (1.1761) lr 4.1221e-04 eta 11:30:44
epoch [41/50] batch [700/2000] time 2.067 (2.142) data 0.000 (0.001) loss 0.4077 (1.1807) lr 4.1221e-04 eta 11:29:07
epoch [41/50] batch [720/2000] time 2.010 (2.140) data 0.000 (0.001) loss 1.9830 (1.1834) lr 4.1221e-04 eta 11:27:31
epoch [41/50] batch [740/2000] time 2.070 (2.137) data 0.000 (0.001) loss 0.1745 (1.1824) lr 4.1221e-04 eta 11:26:00
epoch [41/50] batch [760/2000] time 2.082 (2.135) data 0.000 (0.001) loss 2.2565 (1.1793) lr 4.1221e-04 eta 11:24:39
epoch [41/50] batch [780/2000] time 2.063 (2.133) data 0.000 (0.001) loss 1.1523 (1.1679) lr 4.1221e-04 eta 11:23:11
epoch [41/50] batch [800/2000] time 2.040 (2.131) data 0.000 (0.001) loss 2.2857 (1.1713) lr 4.1221e-04 eta 11:21:45
epoch [41/50] batch [820/2000] time 2.069 (2.128) data 0.000 (0.001) loss 0.7646 (1.1735) lr 4.1221e-04 eta 11:20:21
epoch [41/50] batch [840/2000] time 2.060 (2.126) data 0.000 (0.001) loss 1.1228 (1.1696) lr 4.1221e-04 eta 11:19:02
epoch [41/50] batch [860/2000] time 2.039 (2.124) data 0.000 (0.001) loss 1.8782 (1.1637) lr 4.1221e-04 eta 11:17:39
epoch [41/50] batch [880/2000] time 2.037 (2.122) data 0.000 (0.001) loss 0.0112 (1.1639) lr 4.1221e-04 eta 11:16:20
epoch [41/50] batch [900/2000] time 2.057 (2.121) data 0.000 (0.001) loss 2.2739 (1.1721) lr 4.1221e-04 eta 11:15:04
epoch [41/50] batch [920/2000] time 2.120 (2.119) data 0.001 (0.001) loss 0.4273 (1.1674) lr 4.1221e-04 eta 11:13:56
epoch [41/50] batch [940/2000] time 2.087 (2.119) data 0.001 (0.001) loss 0.4519 (1.1727) lr 4.1221e-04 eta 11:13:09
epoch [41/50] batch [960/2000] time 2.045 (2.118) data 0.001 (0.001) loss 0.5220 (1.1717) lr 4.1221e-04 eta 11:11:59
epoch [41/50] batch [980/2000] time 2.021 (2.117) data 0.001 (0.001) loss 1.2703 (1.1713) lr 4.1221e-04 eta 11:10:58
epoch [41/50] batch [1000/2000] time 2.053 (2.116) data 0.001 (0.001) loss 2.6660 (1.1753) lr 4.1221e-04 eta 11:09:57
epoch [41/50] batch [1020/2000] time 2.291 (2.116) data 0.002 (0.001) loss 0.8722 (1.1761) lr 4.1221e-04 eta 11:09:27
epoch [41/50] batch [1040/2000] time 2.017 (2.115) data 0.001 (0.001) loss 1.3569 (1.1740) lr 4.1221e-04 eta 11:08:26
epoch [41/50] batch [1060/2000] time 2.108 (2.114) data 0.000 (0.001) loss 1.2070 (1.1785) lr 4.1221e-04 eta 11:07:23
epoch [41/50] batch [1080/2000] time 2.062 (2.114) data 0.001 (0.001) loss 2.1385 (1.1816) lr 4.1221e-04 eta 11:06:27
epoch [41/50] batch [1100/2000] time 2.077 (2.113) data 0.000 (0.001) loss 1.0407 (1.1787) lr 4.1221e-04 eta 11:05:31
epoch [41/50] batch [1120/2000] time 2.065 (2.112) data 0.000 (0.001) loss 0.7473 (1.1723) lr 4.1221e-04 eta 11:04:27
epoch [41/50] batch [1140/2000] time 2.011 (2.110) data 0.001 (0.001) loss 2.6763 (1.1685) lr 4.1221e-04 eta 11:03:22
epoch [41/50] batch [1160/2000] time 2.068 (2.109) data 0.001 (0.001) loss 0.6089 (1.1653) lr 4.1221e-04 eta 11:02:21
epoch [41/50] batch [1180/2000] time 2.045 (2.108) data 0.000 (0.001) loss 0.2804 (1.1661) lr 4.1221e-04 eta 11:01:20
epoch [41/50] batch [1200/2000] time 2.011 (2.107) data 0.000 (0.001) loss 2.2707 (1.1640) lr 4.1221e-04 eta 11:00:15
epoch [41/50] batch [1220/2000] time 2.067 (2.106) data 0.000 (0.001) loss 1.5530 (1.1636) lr 4.1221e-04 eta 10:59:14
epoch [41/50] batch [1240/2000] time 2.011 (2.105) data 0.000 (0.001) loss 1.9453 (1.1570) lr 4.1221e-04 eta 10:58:14
epoch [41/50] batch [1260/2000] time 2.007 (2.104) data 0.000 (0.001) loss 1.5338 (1.1591) lr 4.1221e-04 eta 10:57:13
epoch [41/50] batch [1280/2000] time 2.068 (2.103) data 0.000 (0.001) loss 0.1687 (1.1589) lr 4.1221e-04 eta 10:56:12
epoch [41/50] batch [1300/2000] time 2.011 (2.102) data 0.000 (0.001) loss 2.4418 (1.1599) lr 4.1221e-04 eta 10:55:12
epoch [41/50] batch [1320/2000] time 2.012 (2.101) data 0.000 (0.001) loss 0.5956 (1.1583) lr 4.1221e-04 eta 10:54:14
epoch [41/50] batch [1340/2000] time 2.076 (2.101) data 0.000 (0.001) loss 0.2525 (1.1551) lr 4.1221e-04 eta 10:53:18
epoch [41/50] batch [1360/2000] time 2.014 (2.100) data 0.000 (0.001) loss 0.2885 (1.1550) lr 4.1221e-04 eta 10:52:22
epoch [41/50] batch [1380/2000] time 1.984 (2.099) data 0.000 (0.001) loss 2.0154 (1.1529) lr 4.1221e-04 eta 10:51:26
epoch [41/50] batch [1400/2000] time 2.076 (2.099) data 0.000 (0.001) loss 1.0908 (1.1550) lr 4.1221e-04 eta 10:50:32
epoch [41/50] batch [1420/2000] time 2.067 (2.098) data 0.000 (0.001) loss 1.6498 (1.1522) lr 4.1221e-04 eta 10:49:36
epoch [41/50] batch [1440/2000] time 2.058 (2.097) data 0.000 (0.001) loss 0.9589 (1.1496) lr 4.1221e-04 eta 10:48:37
epoch [41/50] batch [1460/2000] time 2.075 (2.096) data 0.000 (0.001) loss 0.0976 (1.1514) lr 4.1221e-04 eta 10:47:44
epoch [41/50] batch [1480/2000] time 1.992 (2.096) data 0.000 (0.001) loss 4.2817 (1.1543) lr 4.1221e-04 eta 10:46:51
epoch [41/50] batch [1500/2000] time 2.039 (2.095) data 0.000 (0.001) loss 1.9820 (1.1540) lr 4.1221e-04 eta 10:45:55
epoch [41/50] batch [1520/2000] time 2.063 (2.094) data 0.000 (0.001) loss 0.7947 (1.1500) lr 4.1221e-04 eta 10:45:00
epoch [41/50] batch [1540/2000] time 2.040 (2.093) data 0.000 (0.001) loss 0.2568 (1.1481) lr 4.1221e-04 eta 10:44:04
epoch [41/50] batch [1560/2000] time 2.038 (2.093) data 0.000 (0.001) loss 0.6916 (1.1510) lr 4.1221e-04 eta 10:43:12
epoch [41/50] batch [1580/2000] time 2.034 (2.092) data 0.000 (0.001) loss 1.1930 (1.1493) lr 4.1221e-04 eta 10:42:18
epoch [41/50] batch [1600/2000] time 2.062 (2.091) data 0.000 (0.001) loss 1.4941 (1.1487) lr 4.1221e-04 eta 10:41:23
epoch [41/50] batch [1620/2000] time 2.055 (2.091) data 0.000 (0.001) loss 0.2602 (1.1472) lr 4.1221e-04 eta 10:40:28
epoch [41/50] batch [1640/2000] time 2.061 (2.090) data 0.000 (0.001) loss 1.3816 (1.1475) lr 4.1221e-04 eta 10:39:36
epoch [41/50] batch [1660/2000] time 2.002 (2.090) data 0.000 (0.001) loss 2.4929 (1.1525) lr 4.1221e-04 eta 10:38:41
epoch [41/50] batch [1680/2000] time 2.038 (2.089) data 0.001 (0.001) loss 1.2151 (1.1502) lr 4.1221e-04 eta 10:37:49
epoch [41/50] batch [1700/2000] time 2.031 (2.088) data 0.000 (0.001) loss 3.0373 (1.1519) lr 4.1221e-04 eta 10:36:55
epoch [41/50] batch [1720/2000] time 2.004 (2.088) data 0.000 (0.001) loss 0.5181 (1.1494) lr 4.1221e-04 eta 10:36:02
epoch [41/50] batch [1740/2000] time 2.065 (2.087) data 0.001 (0.001) loss 1.2937 (1.1479) lr 4.1221e-04 eta 10:35:12
epoch [41/50] batch [1760/2000] time 2.080 (2.087) data 0.001 (0.001) loss 0.6313 (1.1475) lr 4.1221e-04 eta 10:34:20
epoch [41/50] batch [1780/2000] time 2.063 (2.086) data 0.000 (0.001) loss 2.8172 (1.1483) lr 4.1221e-04 eta 10:33:29
epoch [41/50] batch [1800/2000] time 2.005 (2.086) data 0.000 (0.001) loss 0.6739 (1.1452) lr 4.1221e-04 eta 10:32:37
epoch [41/50] batch [1820/2000] time 1.980 (2.085) data 0.000 (0.001) loss 0.4992 (1.1441) lr 4.1221e-04 eta 10:31:44
epoch [41/50] batch [1840/2000] time 2.060 (2.084) data 0.000 (0.001) loss 1.1876 (1.1449) lr 4.1221e-04 eta 10:30:51
epoch [41/50] batch [1860/2000] time 2.034 (2.084) data 0.000 (0.001) loss 0.5179 (1.1436) lr 4.1221e-04 eta 10:29:58
epoch [41/50] batch [1880/2000] time 2.004 (2.083) data 0.000 (0.001) loss 0.8569 (1.1453) lr 4.1221e-04 eta 10:29:07
epoch [41/50] batch [1900/2000] time 2.001 (2.083) data 0.000 (0.001) loss 0.0353 (1.1467) lr 4.1221e-04 eta 10:28:17
epoch [41/50] batch [1920/2000] time 2.046 (2.082) data 0.000 (0.001) loss 0.1927 (1.1500) lr 4.1221e-04 eta 10:27:27
epoch [41/50] batch [1940/2000] time 2.073 (2.082) data 0.000 (0.001) loss 1.3904 (1.1510) lr 4.1221e-04 eta 10:26:39
epoch [41/50] batch [1960/2000] time 2.068 (2.081) data 0.000 (0.001) loss 1.1030 (1.1495) lr 4.1221e-04 eta 10:25:50
epoch [41/50] batch [1980/2000] time 2.004 (2.081) data 0.000 (0.001) loss 0.1254 (1.1486) lr 4.1221e-04 eta 10:25:00
epoch [41/50] batch [2000/2000] time 2.080 (2.081) data 0.000 (0.001) loss 1.4547 (1.1477) lr 3.6258e-04 eta 10:24:09
epoch [42/50] batch [20/2000] time 2.069 (2.099) data 0.000 (0.055) loss 4.4463 (1.2139) lr 3.6258e-04 eta 10:28:53
epoch [42/50] batch [40/2000] time 2.069 (2.069) data 0.000 (0.028) loss 0.6634 (1.3321) lr 3.6258e-04 eta 10:19:14
epoch [42/50] batch [60/2000] time 2.068 (2.061) data 0.001 (0.018) loss 1.7825 (1.3464) lr 3.6258e-04 eta 10:16:21
epoch [42/50] batch [80/2000] time 2.010 (2.056) data 0.000 (0.014) loss 2.1251 (1.1829) lr 3.6258e-04 eta 10:14:07
epoch [42/50] batch [100/2000] time 2.063 (2.054) data 0.000 (0.011) loss 3.1112 (1.1900) lr 3.6258e-04 eta 10:12:41
epoch [42/50] batch [120/2000] time 2.003 (2.052) data 0.000 (0.009) loss 0.6058 (1.2017) lr 3.6258e-04 eta 10:11:24
epoch [42/50] batch [140/2000] time 2.047 (2.050) data 0.000 (0.008) loss 2.1881 (1.2020) lr 3.6258e-04 eta 10:10:10
epoch [42/50] batch [160/2000] time 2.014 (2.049) data 0.000 (0.007) loss 0.1686 (1.1845) lr 3.6258e-04 eta 10:09:05
epoch [42/50] batch [180/2000] time 2.068 (2.048) data 0.000 (0.006) loss 1.2551 (1.1950) lr 3.6258e-04 eta 10:08:22
epoch [42/50] batch [200/2000] time 2.016 (2.048) data 0.000 (0.006) loss 0.9275 (1.1981) lr 3.6258e-04 eta 10:07:34
epoch [42/50] batch [220/2000] time 2.068 (2.048) data 0.000 (0.005) loss 0.3020 (1.1664) lr 3.6258e-04 eta 10:06:48
epoch [42/50] batch [240/2000] time 2.069 (2.048) data 0.000 (0.005) loss 0.6634 (1.1361) lr 3.6258e-04 eta 10:06:08
epoch [42/50] batch [260/2000] time 2.070 (2.048) data 0.000 (0.004) loss 0.3697 (1.1272) lr 3.6258e-04 eta 10:05:33
epoch [42/50] batch [280/2000] time 2.008 (2.048) data 0.000 (0.004) loss 2.9690 (1.1173) lr 3.6258e-04 eta 10:04:59
epoch [42/50] batch [300/2000] time 2.061 (2.048) data 0.000 (0.004) loss 0.9473 (1.0940) lr 3.6258e-04 eta 10:04:03
epoch [42/50] batch [320/2000] time 2.064 (2.047) data 0.000 (0.004) loss 1.3274 (1.0916) lr 3.6258e-04 eta 10:03:05
epoch [42/50] batch [340/2000] time 2.062 (2.047) data 0.000 (0.003) loss 0.6056 (1.0953) lr 3.6258e-04 eta 10:02:21
epoch [42/50] batch [360/2000] time 2.063 (2.046) data 0.000 (0.003) loss 1.3250 (1.1150) lr 3.6258e-04 eta 10:01:39
epoch [42/50] batch [380/2000] time 2.067 (2.047) data 0.000 (0.003) loss 1.6364 (1.1351) lr 3.6258e-04 eta 10:01:02
epoch [42/50] batch [400/2000] time 2.064 (2.046) data 0.000 (0.003) loss 0.6221 (1.1311) lr 3.6258e-04 eta 10:00:15
epoch [42/50] batch [420/2000] time 1.985 (2.046) data 0.000 (0.003) loss 0.7735 (1.1440) lr 3.6258e-04 eta 9:59:28
epoch [42/50] batch [440/2000] time 2.008 (2.046) data 0.000 (0.003) loss 1.1271 (1.1473) lr 3.6258e-04 eta 9:58:45
epoch [42/50] batch [460/2000] time 2.005 (2.045) data 0.000 (0.003) loss 0.3990 (1.1537) lr 3.6258e-04 eta 9:57:56
epoch [42/50] batch [480/2000] time 2.061 (2.045) data 0.000 (0.003) loss 0.2756 (1.1440) lr 3.6258e-04 eta 9:57:12
epoch [42/50] batch [500/2000] time 2.038 (2.045) data 0.000 (0.002) loss 2.4380 (1.1601) lr 3.6258e-04 eta 9:56:27
epoch [42/50] batch [520/2000] time 2.012 (2.045) data 0.000 (0.002) loss 2.6365 (1.1534) lr 3.6258e-04 eta 9:55:43
epoch [42/50] batch [540/2000] time 2.054 (2.045) data 0.000 (0.002) loss 2.1250 (1.1566) lr 3.6258e-04 eta 9:54:59
epoch [42/50] batch [560/2000] time 2.046 (2.045) data 0.005 (0.002) loss 1.8747 (1.1615) lr 3.6258e-04 eta 9:54:23
epoch [42/50] batch [580/2000] time 2.015 (2.045) data 0.000 (0.002) loss 1.0774 (1.1698) lr 3.6258e-04 eta 9:53:42
epoch [42/50] batch [600/2000] time 2.006 (2.045) data 0.001 (0.002) loss 0.2302 (1.1580) lr 3.6258e-04 eta 9:53:05
epoch [42/50] batch [620/2000] time 2.043 (2.045) data 0.000 (0.002) loss 0.6401 (1.1478) lr 3.6258e-04 eta 9:52:23
epoch [42/50] batch [640/2000] time 2.012 (2.045) data 0.000 (0.002) loss 0.6772 (1.1443) lr 3.6258e-04 eta 9:51:40
epoch [42/50] batch [660/2000] time 2.043 (2.045) data 0.000 (0.002) loss 0.0755 (1.1333) lr 3.6258e-04 eta 9:51:01
epoch [42/50] batch [680/2000] time 2.072 (2.045) data 0.000 (0.002) loss 1.1340 (1.1226) lr 3.6258e-04 eta 9:50:23
epoch [42/50] batch [700/2000] time 2.063 (2.045) data 0.000 (0.002) loss 0.0744 (1.1305) lr 3.6258e-04 eta 9:49:38
epoch [42/50] batch [720/2000] time 2.066 (2.045) data 0.000 (0.002) loss 0.3529 (1.1290) lr 3.6258e-04 eta 9:48:53
epoch [42/50] batch [740/2000] time 2.008 (2.045) data 0.000 (0.002) loss 1.7040 (1.1305) lr 3.6258e-04 eta 9:48:09
epoch [42/50] batch [760/2000] time 2.064 (2.045) data 0.000 (0.002) loss 3.2796 (1.1322) lr 3.6258e-04 eta 9:47:30
epoch [42/50] batch [780/2000] time 2.065 (2.045) data 0.000 (0.002) loss 0.1230 (1.1240) lr 3.6258e-04 eta 9:46:47
epoch [42/50] batch [800/2000] time 2.008 (2.045) data 0.000 (0.002) loss 0.7520 (1.1243) lr 3.6258e-04 eta 9:46:06
epoch [42/50] batch [820/2000] time 2.058 (2.044) data 0.000 (0.002) loss 0.8815 (1.1200) lr 3.6258e-04 eta 9:45:23
epoch [42/50] batch [840/2000] time 2.041 (2.044) data 0.000 (0.002) loss 3.6369 (1.1171) lr 3.6258e-04 eta 9:44:37
epoch [42/50] batch [860/2000] time 2.007 (2.044) data 0.000 (0.002) loss 0.7991 (1.1183) lr 3.6258e-04 eta 9:43:58
epoch [42/50] batch [880/2000] time 2.004 (2.044) data 0.000 (0.002) loss 1.6054 (1.1183) lr 3.6258e-04 eta 9:43:16
epoch [42/50] batch [900/2000] time 2.022 (2.044) data 0.000 (0.002) loss 0.4848 (1.1189) lr 3.6258e-04 eta 9:42:35
epoch [42/50] batch [920/2000] time 2.062 (2.044) data 0.000 (0.001) loss 0.5026 (1.1198) lr 3.6258e-04 eta 9:41:53
epoch [42/50] batch [940/2000] time 2.060 (2.044) data 0.000 (0.001) loss 2.0028 (1.1235) lr 3.6258e-04 eta 9:41:11
epoch [42/50] batch [960/2000] time 2.057 (2.044) data 0.000 (0.001) loss 2.8458 (1.1241) lr 3.6258e-04 eta 9:40:24
epoch [42/50] batch [980/2000] time 2.002 (2.043) data 0.000 (0.001) loss 2.7202 (1.1258) lr 3.6258e-04 eta 9:39:39
epoch [42/50] batch [1000/2000] time 2.034 (2.043) data 0.000 (0.001) loss 0.2620 (1.1300) lr 3.6258e-04 eta 9:38:57
epoch [42/50] batch [1020/2000] time 2.059 (2.044) data 0.000 (0.001) loss 0.5439 (1.1353) lr 3.6258e-04 eta 9:38:18
epoch [42/50] batch [1040/2000] time 2.006 (2.043) data 0.000 (0.001) loss 0.4164 (1.1329) lr 3.6258e-04 eta 9:37:35
epoch [42/50] batch [1060/2000] time 2.010 (2.043) data 0.000 (0.001) loss 1.2756 (1.1218) lr 3.6258e-04 eta 9:36:54
epoch [42/50] batch [1080/2000] time 2.068 (2.043) data 0.000 (0.001) loss 0.9604 (1.1231) lr 3.6258e-04 eta 9:36:12
epoch [42/50] batch [1100/2000] time 2.041 (2.043) data 0.000 (0.001) loss 1.8196 (1.1181) lr 3.6258e-04 eta 9:35:28
epoch [42/50] batch [1120/2000] time 2.066 (2.043) data 0.000 (0.001) loss 0.2794 (1.1208) lr 3.6258e-04 eta 9:34:45
epoch [42/50] batch [1140/2000] time 2.068 (2.043) data 0.001 (0.001) loss 0.2828 (1.1245) lr 3.6258e-04 eta 9:34:05
epoch [42/50] batch [1160/2000] time 2.064 (2.043) data 0.000 (0.001) loss 1.2026 (1.1200) lr 3.6258e-04 eta 9:33:23
epoch [42/50] batch [1180/2000] time 2.068 (2.043) data 0.000 (0.001) loss 0.9031 (1.1146) lr 3.6258e-04 eta 9:32:41
epoch [42/50] batch [1200/2000] time 2.066 (2.043) data 0.000 (0.001) loss 0.8849 (1.1181) lr 3.6258e-04 eta 9:31:59
epoch [42/50] batch [1220/2000] time 2.007 (2.043) data 0.000 (0.001) loss 0.1031 (1.1214) lr 3.6258e-04 eta 9:31:17
epoch [42/50] batch [1240/2000] time 2.066 (2.043) data 0.000 (0.001) loss 0.6028 (1.1297) lr 3.6258e-04 eta 9:30:36
epoch [42/50] batch [1260/2000] time 2.065 (2.043) data 0.000 (0.001) loss 1.3371 (1.1303) lr 3.6258e-04 eta 9:29:57
epoch [42/50] batch [1280/2000] time 2.064 (2.043) data 0.000 (0.001) loss 0.9529 (1.1294) lr 3.6258e-04 eta 9:29:17
epoch [42/50] batch [1300/2000] time 2.084 (2.043) data 0.000 (0.001) loss 0.2406 (1.1299) lr 3.6258e-04 eta 9:28:37
epoch [42/50] batch [1320/2000] time 2.070 (2.043) data 0.000 (0.001) loss 0.1476 (1.1283) lr 3.6258e-04 eta 9:27:57
epoch [42/50] batch [1340/2000] time 2.014 (2.043) data 0.000 (0.001) loss 0.4083 (1.1274) lr 3.6258e-04 eta 9:27:19
epoch [42/50] batch [1360/2000] time 2.040 (2.043) data 0.000 (0.001) loss 2.2545 (1.1321) lr 3.6258e-04 eta 9:26:39
epoch [42/50] batch [1380/2000] time 2.010 (2.043) data 0.000 (0.001) loss 1.5490 (1.1311) lr 3.6258e-04 eta 9:25:57
epoch [42/50] batch [1400/2000] time 2.066 (2.043) data 0.000 (0.001) loss 0.6388 (1.1263) lr 3.6258e-04 eta 9:25:15
epoch [42/50] batch [1420/2000] time 2.010 (2.043) data 0.000 (0.001) loss 0.3477 (1.1253) lr 3.6258e-04 eta 9:24:33
epoch [42/50] batch [1440/2000] time 2.010 (2.043) data 0.000 (0.001) loss 2.0915 (1.1233) lr 3.6258e-04 eta 9:23:52
epoch [42/50] batch [1460/2000] time 2.043 (2.043) data 0.000 (0.001) loss 2.3397 (1.1184) lr 3.6258e-04 eta 9:23:12
epoch [42/50] batch [1480/2000] time 2.065 (2.043) data 0.000 (0.001) loss 0.1185 (1.1171) lr 3.6258e-04 eta 9:22:31
epoch [42/50] batch [1500/2000] time 2.064 (2.043) data 0.000 (0.001) loss 0.8222 (1.1157) lr 3.6258e-04 eta 9:21:49
epoch [42/50] batch [1520/2000] time 2.064 (2.043) data 0.000 (0.001) loss 0.3433 (1.1158) lr 3.6258e-04 eta 9:21:09
epoch [42/50] batch [1540/2000] time 2.063 (2.043) data 0.000 (0.001) loss 3.0362 (1.1147) lr 3.6258e-04 eta 9:20:28
epoch [42/50] batch [1560/2000] time 2.067 (2.043) data 0.000 (0.001) loss 1.0419 (1.1141) lr 3.6258e-04 eta 9:19:50
epoch [42/50] batch [1580/2000] time 2.075 (2.043) data 0.000 (0.001) loss 1.7512 (1.1162) lr 3.6258e-04 eta 9:19:09
epoch [42/50] batch [1600/2000] time 2.067 (2.043) data 0.000 (0.001) loss 0.0185 (1.1192) lr 3.6258e-04 eta 9:18:30
epoch [42/50] batch [1620/2000] time 2.066 (2.043) data 0.000 (0.001) loss 0.7470 (1.1191) lr 3.6258e-04 eta 9:17:51
epoch [42/50] batch [1640/2000] time 2.008 (2.043) data 0.000 (0.001) loss 1.1470 (1.1176) lr 3.6258e-04 eta 9:17:09
epoch [42/50] batch [1660/2000] time 2.047 (2.044) data 0.000 (0.001) loss 1.1499 (1.1198) lr 3.6258e-04 eta 9:16:31
epoch [42/50] batch [1680/2000] time 2.010 (2.044) data 0.001 (0.001) loss 1.7640 (1.1225) lr 3.6258e-04 eta 9:15:52
epoch [42/50] batch [1700/2000] time 2.066 (2.044) data 0.000 (0.001) loss 0.1598 (1.1237) lr 3.6258e-04 eta 9:15:12
epoch [42/50] batch [1720/2000] time 2.009 (2.044) data 0.000 (0.001) loss 0.2622 (1.1220) lr 3.6258e-04 eta 9:14:29
epoch [42/50] batch [1740/2000] time 2.042 (2.044) data 0.000 (0.001) loss 0.8191 (1.1227) lr 3.6258e-04 eta 9:13:48
epoch [42/50] batch [1760/2000] time 1.987 (2.043) data 0.000 (0.001) loss 0.7136 (1.1242) lr 3.6258e-04 eta 9:13:05
epoch [42/50] batch [1780/2000] time 2.042 (2.043) data 0.000 (0.001) loss 1.7942 (1.1227) lr 3.6258e-04 eta 9:12:23
epoch [42/50] batch [1800/2000] time 2.012 (2.043) data 0.000 (0.001) loss 0.7721 (1.1250) lr 3.6258e-04 eta 9:11:42
epoch [42/50] batch [1820/2000] time 2.065 (2.043) data 0.000 (0.001) loss 0.5550 (1.1275) lr 3.6258e-04 eta 9:11:00
epoch [42/50] batch [1840/2000] time 2.011 (2.043) data 0.000 (0.001) loss 0.4728 (1.1287) lr 3.6258e-04 eta 9:10:20
epoch [42/50] batch [1860/2000] time 2.046 (2.043) data 0.000 (0.001) loss 0.1494 (1.1284) lr 3.6258e-04 eta 9:09:40
epoch [42/50] batch [1880/2000] time 2.073 (2.043) data 0.000 (0.001) loss 0.8320 (1.1278) lr 3.6258e-04 eta 9:09:00
epoch [42/50] batch [1900/2000] time 2.043 (2.044) data 0.000 (0.001) loss 0.5271 (1.1276) lr 3.6258e-04 eta 9:08:21
epoch [42/50] batch [1920/2000] time 2.009 (2.044) data 0.000 (0.001) loss 0.9697 (1.1275) lr 3.6258e-04 eta 9:07:40
epoch [42/50] batch [1940/2000] time 2.010 (2.044) data 0.000 (0.001) loss 1.1839 (1.1306) lr 3.6258e-04 eta 9:06:59
epoch [42/50] batch [1960/2000] time 2.010 (2.044) data 0.000 (0.001) loss 0.9425 (1.1288) lr 3.6258e-04 eta 9:06:20
epoch [42/50] batch [1980/2000] time 2.067 (2.044) data 0.000 (0.001) loss 0.0865 (1.1315) lr 3.6258e-04 eta 9:05:41
epoch [42/50] batch [2000/2000] time 2.066 (2.044) data 0.000 (0.001) loss 0.2745 (1.1296) lr 3.1545e-04 eta 9:04:59
epoch [43/50] batch [20/2000] time 2.072 (2.078) data 0.001 (0.034) loss 0.6152 (0.6964) lr 3.1545e-04 eta 9:13:33
epoch [43/50] batch [40/2000] time 2.064 (2.062) data 0.000 (0.018) loss 0.3404 (1.1385) lr 3.1545e-04 eta 9:08:32
epoch [43/50] batch [60/2000] time 2.063 (2.055) data 0.001 (0.012) loss 0.8384 (1.1432) lr 3.1545e-04 eta 9:06:03
epoch [43/50] batch [80/2000] time 2.039 (2.053) data 0.000 (0.009) loss 1.2360 (1.1370) lr 3.1545e-04 eta 9:04:43
epoch [43/50] batch [100/2000] time 2.042 (2.051) data 0.000 (0.007) loss 0.9671 (1.1211) lr 3.1545e-04 eta 9:03:34
epoch [43/50] batch [120/2000] time 2.072 (2.050) data 0.000 (0.006) loss 2.4060 (1.1628) lr 3.1545e-04 eta 9:02:39
epoch [43/50] batch [140/2000] time 2.010 (2.049) data 0.000 (0.005) loss 1.4029 (1.1197) lr 3.1545e-04 eta 9:01:44
epoch [43/50] batch [160/2000] time 2.012 (2.049) data 0.000 (0.005) loss 1.4091 (1.1331) lr 3.1545e-04 eta 9:00:51
epoch [43/50] batch [180/2000] time 2.055 (2.048) data 0.000 (0.004) loss 1.8424 (1.1295) lr 3.1545e-04 eta 9:00:00
epoch [43/50] batch [200/2000] time 2.040 (2.048) data 0.000 (0.004) loss 2.4999 (1.1146) lr 3.1545e-04 eta 8:59:15
epoch [43/50] batch [220/2000] time 2.064 (2.048) data 0.000 (0.003) loss 0.6926 (1.1142) lr 3.1545e-04 eta 8:58:31
epoch [43/50] batch [240/2000] time 2.070 (2.047) data 0.000 (0.003) loss 0.9408 (1.0991) lr 3.1545e-04 eta 8:57:39
epoch [43/50] batch [260/2000] time 2.013 (2.046) data 0.000 (0.003) loss 1.7882 (1.1157) lr 3.1545e-04 eta 8:56:51
epoch [43/50] batch [280/2000] time 2.065 (2.047) data 0.000 (0.003) loss 0.3899 (1.1176) lr 3.1545e-04 eta 8:56:11
epoch [43/50] batch [300/2000] time 2.040 (2.046) data 0.000 (0.003) loss 1.4998 (1.1286) lr 3.1545e-04 eta 8:55:20
epoch [43/50] batch [320/2000] time 2.044 (2.046) data 0.000 (0.002) loss 0.0788 (1.1217) lr 3.1545e-04 eta 8:54:34
epoch [43/50] batch [340/2000] time 2.043 (2.045) data 0.000 (0.002) loss 0.2714 (1.1011) lr 3.1545e-04 eta 8:53:44
epoch [43/50] batch [360/2000] time 2.044 (2.045) data 0.000 (0.002) loss 3.1748 (1.1169) lr 3.1545e-04 eta 8:52:58
epoch [43/50] batch [380/2000] time 2.065 (2.045) data 0.000 (0.002) loss 0.3460 (1.1139) lr 3.1545e-04 eta 8:52:20
epoch [43/50] batch [400/2000] time 2.066 (2.045) data 0.000 (0.002) loss 0.8041 (1.1035) lr 3.1545e-04 eta 8:51:35
epoch [43/50] batch [420/2000] time 2.069 (2.045) data 0.000 (0.002) loss 0.7969 (1.1006) lr 3.1545e-04 eta 8:50:54
epoch [43/50] batch [440/2000] time 2.068 (2.045) data 0.000 (0.002) loss 3.3974 (1.1109) lr 3.1545e-04 eta 8:50:17
epoch [43/50] batch [460/2000] time 2.072 (2.045) data 0.000 (0.002) loss 1.8590 (1.1156) lr 3.1545e-04 eta 8:49:35
epoch [43/50] batch [480/2000] time 2.069 (2.045) data 0.000 (0.002) loss 0.0468 (1.1205) lr 3.1545e-04 eta 8:48:59
epoch [43/50] batch [500/2000] time 2.064 (2.045) data 0.000 (0.002) loss 3.2592 (1.1425) lr 3.1545e-04 eta 8:48:19
epoch [43/50] batch [520/2000] time 2.047 (2.045) data 0.004 (0.002) loss 0.9934 (1.1348) lr 3.1545e-04 eta 8:47:39
epoch [43/50] batch [540/2000] time 2.044 (2.045) data 0.000 (0.002) loss 1.6047 (1.1306) lr 3.1545e-04 eta 8:46:53
epoch [43/50] batch [560/2000] time 2.066 (2.045) data 0.000 (0.002) loss 0.3204 (1.1251) lr 3.1545e-04 eta 8:46:11
epoch [43/50] batch [580/2000] time 2.069 (2.045) data 0.000 (0.001) loss 0.1108 (1.1290) lr 3.1545e-04 eta 8:45:32
epoch [43/50] batch [600/2000] time 1.985 (2.045) data 0.001 (0.001) loss 1.3897 (1.1206) lr 3.1545e-04 eta 8:44:47
epoch [43/50] batch [620/2000] time 2.042 (2.045) data 0.000 (0.001) loss 1.4246 (1.1213) lr 3.1545e-04 eta 8:44:08
epoch [43/50] batch [640/2000] time 2.065 (2.044) data 0.000 (0.001) loss 0.7636 (1.1220) lr 3.1545e-04 eta 8:43:22
epoch [43/50] batch [660/2000] time 2.046 (2.044) data 0.000 (0.001) loss 1.1097 (1.1274) lr 3.1545e-04 eta 8:42:39
epoch [43/50] batch [680/2000] time 2.069 (2.044) data 0.000 (0.001) loss 1.0504 (1.1260) lr 3.1545e-04 eta 8:41:59
epoch [43/50] batch [700/2000] time 2.067 (2.044) data 0.000 (0.001) loss 2.0369 (1.1276) lr 3.1545e-04 eta 8:41:20
epoch [43/50] batch [720/2000] time 2.012 (2.044) data 0.000 (0.001) loss 0.1290 (1.1227) lr 3.1545e-04 eta 8:40:37
epoch [43/50] batch [740/2000] time 2.007 (2.044) data 0.000 (0.001) loss 3.8851 (1.1259) lr 3.1545e-04 eta 8:39:54
epoch [43/50] batch [760/2000] time 2.051 (2.044) data 0.000 (0.001) loss 1.3087 (1.1255) lr 3.1545e-04 eta 8:39:11
epoch [43/50] batch [780/2000] time 2.013 (2.044) data 0.000 (0.001) loss 0.6527 (1.1199) lr 3.1545e-04 eta 8:38:31
epoch [43/50] batch [800/2000] time 2.008 (2.044) data 0.000 (0.001) loss 1.1086 (1.1170) lr 3.1545e-04 eta 8:37:51
epoch [43/50] batch [820/2000] time 2.065 (2.044) data 0.000 (0.001) loss 0.1007 (1.1122) lr 3.1545e-04 eta 8:37:09
epoch [43/50] batch [840/2000] time 2.009 (2.044) data 0.000 (0.001) loss 1.2790 (1.1092) lr 3.1545e-04 eta 8:36:27
epoch [43/50] batch [860/2000] time 2.068 (2.044) data 0.000 (0.001) loss 0.5356 (1.1081) lr 3.1545e-04 eta 8:35:48
epoch [43/50] batch [880/2000] time 2.010 (2.044) data 0.000 (0.001) loss 0.5112 (1.1071) lr 3.1545e-04 eta 8:35:07
epoch [43/50] batch [900/2000] time 2.066 (2.044) data 0.000 (0.001) loss 0.4361 (1.1131) lr 3.1545e-04 eta 8:34:27
epoch [43/50] batch [920/2000] time 2.012 (2.044) data 0.000 (0.001) loss 0.5968 (1.1213) lr 3.1545e-04 eta 8:33:46
epoch [43/50] batch [940/2000] time 2.062 (2.044) data 0.000 (0.001) loss 4.2608 (1.1233) lr 3.1545e-04 eta 8:33:05
epoch [43/50] batch [960/2000] time 2.067 (2.044) data 0.000 (0.001) loss 0.3382 (1.1197) lr 3.1545e-04 eta 8:32:23
epoch [43/50] batch [980/2000] time 2.070 (2.044) data 0.000 (0.001) loss 0.8202 (1.1137) lr 3.1545e-04 eta 8:31:42
epoch [43/50] batch [1000/2000] time 2.082 (2.044) data 0.000 (0.001) loss 1.0410 (1.1106) lr 3.1545e-04 eta 8:31:01
epoch [43/50] batch [1020/2000] time 2.006 (2.044) data 0.000 (0.001) loss 0.1950 (1.1080) lr 3.1545e-04 eta 8:30:19
epoch [43/50] batch [1040/2000] time 2.066 (2.044) data 0.000 (0.001) loss 0.8150 (1.1063) lr 3.1545e-04 eta 8:29:37
epoch [43/50] batch [1060/2000] time 2.069 (2.044) data 0.001 (0.001) loss 0.3154 (1.1066) lr 3.1545e-04 eta 8:28:57
epoch [43/50] batch [1080/2000] time 2.040 (2.044) data 0.000 (0.001) loss 0.8087 (1.1046) lr 3.1545e-04 eta 8:28:16
epoch [43/50] batch [1100/2000] time 2.041 (2.044) data 0.000 (0.001) loss 0.9603 (1.1159) lr 3.1545e-04 eta 8:27:36
epoch [43/50] batch [1120/2000] time 2.044 (2.044) data 0.000 (0.001) loss 0.4530 (1.1111) lr 3.1545e-04 eta 8:26:56
epoch [43/50] batch [1140/2000] time 2.066 (2.044) data 0.001 (0.001) loss 1.8835 (1.1151) lr 3.1545e-04 eta 8:26:15
epoch [43/50] batch [1160/2000] time 2.067 (2.044) data 0.000 (0.001) loss 2.2128 (1.1160) lr 3.1545e-04 eta 8:25:34
epoch [43/50] batch [1180/2000] time 1.984 (2.044) data 0.000 (0.001) loss 0.1406 (1.1170) lr 3.1545e-04 eta 8:24:52
epoch [43/50] batch [1200/2000] time 2.067 (2.044) data 0.000 (0.001) loss 1.2409 (1.1190) lr 3.1545e-04 eta 8:24:12
epoch [43/50] batch [1220/2000] time 2.069 (2.044) data 0.000 (0.001) loss 0.5477 (1.1262) lr 3.1545e-04 eta 8:23:32
epoch [43/50] batch [1240/2000] time 2.045 (2.044) data 0.000 (0.001) loss 0.4667 (1.1307) lr 3.1545e-04 eta 8:22:53
epoch [43/50] batch [1260/2000] time 1.985 (2.044) data 0.000 (0.001) loss 1.4407 (1.1327) lr 3.1545e-04 eta 8:22:12
epoch [43/50] batch [1280/2000] time 2.016 (2.044) data 0.000 (0.001) loss 0.3222 (1.1340) lr 3.1545e-04 eta 8:21:30
epoch [43/50] batch [1300/2000] time 2.068 (2.044) data 0.000 (0.001) loss 0.3054 (1.1294) lr 3.1545e-04 eta 8:20:48
epoch [43/50] batch [1320/2000] time 2.015 (2.044) data 0.000 (0.001) loss 0.0859 (1.1264) lr 3.1545e-04 eta 8:20:06
epoch [43/50] batch [1340/2000] time 2.068 (2.044) data 0.000 (0.001) loss 0.9370 (1.1283) lr 3.1545e-04 eta 8:19:24
epoch [43/50] batch [1360/2000] time 2.068 (2.044) data 0.000 (0.001) loss 2.2402 (1.1328) lr 3.1545e-04 eta 8:18:43
epoch [43/50] batch [1380/2000] time 2.008 (2.044) data 0.000 (0.001) loss 2.1432 (1.1311) lr 3.1545e-04 eta 8:18:04
epoch [43/50] batch [1400/2000] time 2.009 (2.044) data 0.000 (0.001) loss 0.7660 (1.1309) lr 3.1545e-04 eta 8:17:22
epoch [43/50] batch [1420/2000] time 2.067 (2.044) data 0.000 (0.001) loss 1.2401 (1.1362) lr 3.1545e-04 eta 8:16:42
epoch [43/50] batch [1440/2000] time 2.065 (2.044) data 0.000 (0.001) loss 1.6717 (1.1313) lr 3.1545e-04 eta 8:15:59
epoch [43/50] batch [1460/2000] time 2.011 (2.044) data 0.000 (0.001) loss 3.1727 (1.1310) lr 3.1545e-04 eta 8:15:17
epoch [43/50] batch [1480/2000] time 2.010 (2.044) data 0.000 (0.001) loss 0.9973 (1.1301) lr 3.1545e-04 eta 8:14:38
epoch [43/50] batch [1500/2000] time 2.042 (2.044) data 0.000 (0.001) loss 1.1576 (1.1332) lr 3.1545e-04 eta 8:13:56
epoch [43/50] batch [1520/2000] time 2.050 (2.044) data 0.000 (0.001) loss 0.3496 (1.1362) lr 3.1545e-04 eta 8:13:14
epoch [43/50] batch [1540/2000] time 2.041 (2.044) data 0.000 (0.001) loss 0.5508 (1.1371) lr 3.1545e-04 eta 8:12:34
epoch [43/50] batch [1560/2000] time 2.068 (2.044) data 0.000 (0.001) loss 1.4287 (1.1355) lr 3.1545e-04 eta 8:11:52
epoch [43/50] batch [1580/2000] time 2.044 (2.044) data 0.000 (0.001) loss 1.3130 (1.1355) lr 3.1545e-04 eta 8:11:11
epoch [43/50] batch [1600/2000] time 2.018 (2.044) data 0.000 (0.001) loss 2.3914 (1.1387) lr 3.1545e-04 eta 8:10:28
epoch [43/50] batch [1620/2000] time 2.045 (2.044) data 0.000 (0.001) loss 0.3057 (1.1410) lr 3.1545e-04 eta 8:09:47
epoch [43/50] batch [1640/2000] time 2.021 (2.044) data 0.013 (0.001) loss 0.2925 (1.1414) lr 3.1545e-04 eta 8:09:06
epoch [43/50] batch [1660/2000] time 2.069 (2.044) data 0.000 (0.001) loss 0.0861 (1.1398) lr 3.1545e-04 eta 8:08:27
epoch [43/50] batch [1680/2000] time 2.040 (2.044) data 0.001 (0.001) loss 2.2025 (1.1411) lr 3.1545e-04 eta 8:07:45
epoch [43/50] batch [1700/2000] time 2.065 (2.044) data 0.000 (0.001) loss 1.7831 (1.1423) lr 3.1545e-04 eta 8:07:05
epoch [43/50] batch [1720/2000] time 1.985 (2.044) data 0.000 (0.001) loss 0.3479 (1.1393) lr 3.1545e-04 eta 8:06:23
epoch [43/50] batch [1740/2000] time 2.041 (2.044) data 0.000 (0.001) loss 0.3249 (1.1374) lr 3.1545e-04 eta 8:05:40
epoch [43/50] batch [1760/2000] time 2.069 (2.044) data 0.000 (0.001) loss 1.7822 (1.1380) lr 3.1545e-04 eta 8:05:01
epoch [43/50] batch [1780/2000] time 2.035 (2.044) data 0.000 (0.001) loss 0.3939 (1.1370) lr 3.1545e-04 eta 8:04:20
epoch [43/50] batch [1800/2000] time 2.013 (2.044) data 0.000 (0.001) loss 1.6109 (1.1363) lr 3.1545e-04 eta 8:03:38
epoch [43/50] batch [1820/2000] time 2.038 (2.043) data 0.000 (0.001) loss 2.4018 (1.1358) lr 3.1545e-04 eta 8:02:56
epoch [43/50] batch [1840/2000] time 2.008 (2.044) data 0.000 (0.001) loss 1.4758 (1.1370) lr 3.1545e-04 eta 8:02:16
epoch [43/50] batch [1860/2000] time 2.039 (2.044) data 0.000 (0.001) loss 1.0350 (1.1361) lr 3.1545e-04 eta 8:01:35
epoch [43/50] batch [1880/2000] time 2.066 (2.044) data 0.000 (0.001) loss 3.3905 (1.1394) lr 3.1545e-04 eta 8:00:55
epoch [43/50] batch [1900/2000] time 2.068 (2.044) data 0.000 (0.001) loss 1.3679 (1.1388) lr 3.1545e-04 eta 8:00:13
epoch [43/50] batch [1920/2000] time 2.068 (2.044) data 0.000 (0.001) loss 4.0567 (1.1400) lr 3.1545e-04 eta 7:59:33
epoch [43/50] batch [1940/2000] time 2.007 (2.044) data 0.000 (0.001) loss 0.4360 (1.1414) lr 3.1545e-04 eta 7:58:52
epoch [43/50] batch [1960/2000] time 2.075 (2.044) data 0.000 (0.001) loss 3.2167 (1.1420) lr 3.1545e-04 eta 7:58:11
epoch [43/50] batch [1980/2000] time 2.061 (2.044) data 0.000 (0.001) loss 0.6362 (1.1431) lr 3.1545e-04 eta 7:57:30
epoch [43/50] batch [2000/2000] time 2.005 (2.043) data 0.000 (0.001) loss 0.5974 (1.1410) lr 2.7103e-04 eta 7:56:48
epoch [44/50] batch [20/2000] time 2.058 (2.068) data 0.000 (0.029) loss 0.1307 (1.1537) lr 2.7103e-04 eta 8:01:57
epoch [44/50] batch [40/2000] time 2.008 (2.049) data 0.000 (0.015) loss 0.6916 (1.0963) lr 2.7103e-04 eta 7:56:48
epoch [44/50] batch [60/2000] time 2.060 (2.046) data 0.001 (0.010) loss 0.0574 (1.0526) lr 2.7103e-04 eta 7:55:19
epoch [44/50] batch [80/2000] time 2.015 (2.044) data 0.000 (0.007) loss 0.7069 (1.0473) lr 2.7103e-04 eta 7:54:17
epoch [44/50] batch [100/2000] time 2.036 (2.045) data 0.000 (0.006) loss 0.4717 (1.0815) lr 2.7103e-04 eta 7:53:40
epoch [44/50] batch [120/2000] time 2.060 (2.043) data 0.000 (0.005) loss 0.7525 (1.0372) lr 2.7103e-04 eta 7:52:40
epoch [44/50] batch [140/2000] time 2.058 (2.043) data 0.000 (0.004) loss 2.5821 (1.0577) lr 2.7103e-04 eta 7:51:50
epoch [44/50] batch [160/2000] time 2.044 (2.042) data 0.000 (0.004) loss 0.7896 (1.1122) lr 2.7103e-04 eta 7:50:58
epoch [44/50] batch [180/2000] time 2.163 (2.056) data 0.000 (0.003) loss 0.5065 (1.1078) lr 2.7103e-04 eta 7:53:38
epoch [44/50] batch [200/2000] time 2.510 (2.080) data 0.000 (0.003) loss 1.4419 (1.1711) lr 2.7103e-04 eta 7:58:22
epoch [44/50] batch [220/2000] time 2.168 (2.098) data 0.000 (0.003) loss 1.7853 (1.1600) lr 2.7103e-04 eta 8:01:51
epoch [44/50] batch [240/2000] time 2.581 (2.114) data 0.001 (0.003) loss 0.4409 (1.1555) lr 2.7103e-04 eta 8:04:46
epoch [44/50] batch [260/2000] time 2.224 (2.127) data 0.000 (0.003) loss 1.0252 (1.1213) lr 2.7103e-04 eta 8:07:06
epoch [44/50] batch [280/2000] time 2.258 (2.139) data 0.000 (0.002) loss 1.3151 (1.1186) lr 2.7103e-04 eta 8:09:01
epoch [44/50] batch [300/2000] time 2.575 (2.149) data 0.000 (0.002) loss 1.3549 (1.1350) lr 2.7103e-04 eta 8:10:39
epoch [44/50] batch [320/2000] time 2.206 (2.159) data 0.000 (0.002) loss 3.0211 (1.1279) lr 2.7103e-04 eta 8:12:13
epoch [44/50] batch [340/2000] time 2.212 (2.168) data 0.000 (0.002) loss 1.7172 (1.1354) lr 2.7103e-04 eta 8:13:40
epoch [44/50] batch [360/2000] time 2.354 (2.176) data 0.000 (0.002) loss 1.3788 (1.1566) lr 2.7103e-04 eta 8:14:44
epoch [44/50] batch [380/2000] time 2.522 (2.182) data 0.000 (0.002) loss 0.2794 (1.1435) lr 2.7103e-04 eta 8:15:21
epoch [44/50] batch [400/2000] time 2.177 (2.188) data 0.000 (0.002) loss 1.6720 (1.1367) lr 2.7103e-04 eta 8:15:56
epoch [44/50] batch [420/2000] time 2.152 (2.194) data 0.000 (0.002) loss 1.8984 (1.1395) lr 2.7103e-04 eta 8:16:33
epoch [44/50] batch [440/2000] time 2.532 (2.200) data 0.000 (0.002) loss 0.2232 (1.1307) lr 2.7103e-04 eta 8:17:05
epoch [44/50] batch [460/2000] time 2.063 (2.194) data 0.000 (0.002) loss 1.7426 (1.1276) lr 2.7103e-04 eta 8:15:00
epoch [44/50] batch [480/2000] time 2.061 (2.187) data 0.000 (0.001) loss 0.4070 (1.1389) lr 2.7103e-04 eta 8:12:52
epoch [44/50] batch [500/2000] time 2.014 (2.182) data 0.000 (0.001) loss 1.7316 (1.1358) lr 2.7103e-04 eta 8:10:51
epoch [44/50] batch [520/2000] time 2.039 (2.176) data 0.000 (0.001) loss 0.5516 (1.1276) lr 2.7103e-04 eta 8:08:56
epoch [44/50] batch [540/2000] time 2.010 (2.171) data 0.000 (0.001) loss 0.8270 (1.1224) lr 2.7103e-04 eta 8:07:04
epoch [44/50] batch [560/2000] time 2.062 (2.166) data 0.000 (0.001) loss 2.0055 (1.1305) lr 2.7103e-04 eta 8:05:17
epoch [44/50] batch [580/2000] time 2.061 (2.162) data 0.000 (0.001) loss 1.2670 (1.1329) lr 2.7103e-04 eta 8:03:36
epoch [44/50] batch [600/2000] time 2.061 (2.158) data 0.001 (0.001) loss 1.7564 (1.1293) lr 2.7103e-04 eta 8:01:57
epoch [44/50] batch [620/2000] time 2.039 (2.154) data 0.000 (0.001) loss 0.1820 (1.1339) lr 2.7103e-04 eta 8:00:26
epoch [44/50] batch [640/2000] time 2.009 (2.151) data 0.000 (0.001) loss 0.1029 (1.1259) lr 2.7103e-04 eta 7:58:57
epoch [44/50] batch [660/2000] time 2.063 (2.148) data 0.000 (0.001) loss 0.2633 (1.1274) lr 2.7103e-04 eta 7:57:31
epoch [44/50] batch [680/2000] time 2.012 (2.145) data 0.000 (0.001) loss 3.5464 (1.1285) lr 2.7103e-04 eta 7:56:08
epoch [44/50] batch [700/2000] time 2.043 (2.142) data 0.000 (0.001) loss 0.1634 (1.1249) lr 2.7103e-04 eta 7:54:45
epoch [44/50] batch [720/2000] time 2.063 (2.139) data 0.000 (0.001) loss 0.8384 (1.1312) lr 2.7103e-04 eta 7:53:24
epoch [44/50] batch [740/2000] time 2.045 (2.136) data 0.000 (0.001) loss 1.0113 (1.1403) lr 2.7103e-04 eta 7:52:05
epoch [44/50] batch [760/2000] time 2.063 (2.133) data 0.000 (0.001) loss 1.9115 (1.1423) lr 2.7103e-04 eta 7:50:45
epoch [44/50] batch [780/2000] time 1.987 (2.131) data 0.000 (0.001) loss 2.5283 (1.1419) lr 2.7103e-04 eta 7:49:31
epoch [44/50] batch [800/2000] time 2.081 (2.129) data 0.005 (0.001) loss 1.3767 (1.1415) lr 2.7103e-04 eta 7:48:24
epoch [44/50] batch [820/2000] time 2.066 (2.127) data 0.000 (0.001) loss 2.7542 (1.1405) lr 2.7103e-04 eta 7:47:13
epoch [44/50] batch [840/2000] time 2.046 (2.125) data 0.000 (0.001) loss 0.7349 (1.1411) lr 2.7103e-04 eta 7:46:05
epoch [44/50] batch [860/2000] time 1.986 (2.123) data 0.000 (0.001) loss 0.5244 (1.1406) lr 2.7103e-04 eta 7:44:55
epoch [44/50] batch [880/2000] time 2.013 (2.121) data 0.000 (0.001) loss 0.8533 (1.1354) lr 2.7103e-04 eta 7:43:51
epoch [44/50] batch [900/2000] time 2.010 (2.120) data 0.001 (0.001) loss 1.2446 (1.1302) lr 2.7103e-04 eta 7:42:46
epoch [44/50] batch [920/2000] time 2.066 (2.118) data 0.000 (0.001) loss 0.6110 (1.1332) lr 2.7103e-04 eta 7:41:44
epoch [44/50] batch [940/2000] time 2.067 (2.117) data 0.000 (0.001) loss 1.9547 (1.1253) lr 2.7103e-04 eta 7:40:42
epoch [44/50] batch [960/2000] time 2.280 (2.117) data 0.000 (0.001) loss 0.1597 (1.1295) lr 2.7103e-04 eta 7:40:02
epoch [44/50] batch [980/2000] time 2.205 (2.120) data 0.000 (0.001) loss 1.3002 (1.1199) lr 2.7103e-04 eta 7:40:08
epoch [44/50] batch [1000/2000] time 2.434 (2.124) data 0.000 (0.001) loss 1.9986 (1.1300) lr 2.7103e-04 eta 7:40:12
epoch [44/50] batch [1020/2000] time 2.183 (2.127) data 0.000 (0.001) loss 0.9245 (1.1291) lr 2.7103e-04 eta 7:40:07
epoch [44/50] batch [1040/2000] time 2.180 (2.131) data 0.000 (0.001) loss 0.1030 (1.1240) lr 2.7103e-04 eta 7:40:12
epoch [44/50] batch [1060/2000] time 2.535 (2.134) data 0.000 (0.001) loss 0.5957 (1.1263) lr 2.7103e-04 eta 7:40:13
epoch [44/50] batch [1080/2000] time 2.179 (2.137) data 0.005 (0.001) loss 1.5578 (1.1264) lr 2.7103e-04 eta 7:40:08
epoch [44/50] batch [1100/2000] time 2.175 (2.140) data 0.000 (0.001) loss 0.9560 (1.1276) lr 2.7103e-04 eta 7:40:06
epoch [44/50] batch [1120/2000] time 2.607 (2.143) data 0.000 (0.001) loss 2.5758 (1.1361) lr 2.7103e-04 eta 7:40:05
epoch [44/50] batch [1140/2000] time 2.327 (2.146) data 0.001 (0.001) loss 2.2880 (1.1357) lr 2.7103e-04 eta 7:39:57
epoch [44/50] batch [1160/2000] time 2.183 (2.149) data 0.000 (0.001) loss 2.1591 (1.1352) lr 2.7103e-04 eta 7:39:49
epoch [44/50] batch [1180/2000] time 2.198 (2.151) data 0.000 (0.001) loss 0.4634 (1.1372) lr 2.7103e-04 eta 7:39:42
epoch [44/50] batch [1200/2000] time 2.505 (2.154) data 0.000 (0.001) loss 0.9923 (1.1359) lr 2.7103e-04 eta 7:39:30
epoch [44/50] batch [1220/2000] time 2.166 (2.156) data 0.000 (0.001) loss 0.1687 (1.1325) lr 2.7103e-04 eta 7:39:18
epoch [44/50] batch [1240/2000] time 2.069 (2.156) data 0.000 (0.001) loss 0.0968 (1.1274) lr 2.7103e-04 eta 7:38:27
epoch [44/50] batch [1260/2000] time 2.073 (2.154) data 0.000 (0.001) loss 0.2578 (1.1246) lr 2.7103e-04 eta 7:37:21
epoch [44/50] batch [1280/2000] time 2.044 (2.152) data 0.000 (0.001) loss 0.3163 (1.1253) lr 2.7103e-04 eta 7:36:16
epoch [44/50] batch [1300/2000] time 2.072 (2.151) data 0.000 (0.001) loss 0.7568 (1.1249) lr 2.7103e-04 eta 7:35:11
epoch [44/50] batch [1320/2000] time 2.013 (2.149) data 0.000 (0.001) loss 1.8119 (1.1239) lr 2.7103e-04 eta 7:34:07
epoch [44/50] batch [1340/2000] time 2.069 (2.147) data 0.000 (0.001) loss 4.4574 (1.1285) lr 2.7103e-04 eta 7:33:03
epoch [44/50] batch [1360/2000] time 2.015 (2.146) data 0.001 (0.001) loss 2.6941 (1.1313) lr 2.7103e-04 eta 7:32:02
epoch [44/50] batch [1380/2000] time 2.019 (2.144) data 0.000 (0.001) loss 0.7426 (1.1332) lr 2.7103e-04 eta 7:31:00
epoch [44/50] batch [1400/2000] time 2.071 (2.143) data 0.000 (0.001) loss 0.5035 (1.1350) lr 2.7103e-04 eta 7:29:59
epoch [44/50] batch [1420/2000] time 2.067 (2.141) data 0.000 (0.001) loss 0.3475 (1.1345) lr 2.7103e-04 eta 7:28:59
epoch [44/50] batch [1440/2000] time 2.043 (2.140) data 0.000 (0.001) loss 0.1530 (1.1316) lr 2.7103e-04 eta 7:28:00
epoch [44/50] batch [1460/2000] time 2.067 (2.139) data 0.000 (0.001) loss 1.4060 (1.1303) lr 2.7103e-04 eta 7:27:00
epoch [44/50] batch [1480/2000] time 2.067 (2.138) data 0.000 (0.001) loss 0.4260 (1.1334) lr 2.7103e-04 eta 7:26:02
epoch [44/50] batch [1500/2000] time 2.067 (2.136) data 0.000 (0.001) loss 1.7799 (1.1326) lr 2.7103e-04 eta 7:25:04
epoch [44/50] batch [1520/2000] time 2.014 (2.135) data 0.000 (0.001) loss 0.0661 (1.1314) lr 2.7103e-04 eta 7:24:06
epoch [44/50] batch [1540/2000] time 2.010 (2.134) data 0.000 (0.001) loss 0.8741 (1.1313) lr 2.7103e-04 eta 7:23:07
epoch [44/50] batch [1560/2000] time 2.013 (2.133) data 0.000 (0.001) loss 1.0390 (1.1361) lr 2.7103e-04 eta 7:22:10
epoch [44/50] batch [1580/2000] time 2.020 (2.132) data 0.000 (0.001) loss 1.8095 (1.1343) lr 2.7103e-04 eta 7:21:13
epoch [44/50] batch [1600/2000] time 2.011 (2.130) data 0.000 (0.001) loss 0.2112 (1.1309) lr 2.7103e-04 eta 7:20:18
epoch [44/50] batch [1620/2000] time 2.161 (2.131) data 0.000 (0.001) loss 0.0696 (1.1319) lr 2.7103e-04 eta 7:19:43
epoch [44/50] batch [1640/2000] time 2.164 (2.134) data 0.000 (0.001) loss 3.8708 (1.1363) lr 2.7103e-04 eta 7:19:30
epoch [44/50] batch [1660/2000] time 2.337 (2.135) data 0.000 (0.001) loss 0.2502 (1.1356) lr 2.7103e-04 eta 7:19:08
epoch [44/50] batch [1680/2000] time 2.174 (2.137) data 0.001 (0.001) loss 0.6842 (1.1365) lr 2.7103e-04 eta 7:18:48
epoch [44/50] batch [1700/2000] time 2.332 (2.139) data 0.000 (0.001) loss 0.5966 (1.1367) lr 2.7103e-04 eta 7:18:33
epoch [44/50] batch [1720/2000] time 2.469 (2.141) data 0.000 (0.001) loss 1.3009 (1.1371) lr 2.7103e-04 eta 7:18:11
epoch [44/50] batch [1740/2000] time 2.200 (2.143) data 0.000 (0.001) loss 1.0781 (1.1352) lr 2.7103e-04 eta 7:17:50
epoch [44/50] batch [1760/2000] time 2.154 (2.145) data 0.000 (0.001) loss 2.8501 (1.1379) lr 2.7103e-04 eta 7:17:31
epoch [44/50] batch [1780/2000] time 2.548 (2.147) data 0.000 (0.001) loss 0.3733 (1.1383) lr 2.7103e-04 eta 7:17:12
epoch [44/50] batch [1800/2000] time 2.168 (2.148) data 0.000 (0.001) loss 0.2426 (1.1364) lr 2.7103e-04 eta 7:16:49
epoch [44/50] batch [1820/2000] time 2.206 (2.150) data 0.000 (0.001) loss 0.1009 (1.1393) lr 2.7103e-04 eta 7:16:30
epoch [44/50] batch [1840/2000] time 2.206 (2.152) data 0.000 (0.001) loss 0.5825 (1.1396) lr 2.7103e-04 eta 7:16:11
epoch [44/50] batch [1860/2000] time 2.448 (2.154) data 0.000 (0.001) loss 0.5701 (1.1391) lr 2.7103e-04 eta 7:15:48
epoch [44/50] batch [1880/2000] time 2.198 (2.155) data 0.000 (0.001) loss 2.1463 (1.1390) lr 2.7103e-04 eta 7:15:22
epoch [44/50] batch [1900/2000] time 2.049 (2.154) data 0.000 (0.001) loss 0.3049 (1.1375) lr 2.7103e-04 eta 7:14:26
epoch [44/50] batch [1920/2000] time 2.066 (2.153) data 0.000 (0.001) loss 0.1722 (1.1368) lr 2.7103e-04 eta 7:13:30
epoch [44/50] batch [1940/2000] time 2.066 (2.152) data 0.001 (0.001) loss 0.5693 (1.1356) lr 2.7103e-04 eta 7:12:34
epoch [44/50] batch [1960/2000] time 2.008 (2.151) data 0.000 (0.001) loss 0.3590 (1.1376) lr 2.7103e-04 eta 7:11:38
epoch [44/50] batch [1980/2000] time 2.063 (2.150) data 0.000 (0.001) loss 2.4607 (1.1370) lr 2.7103e-04 eta 7:10:42
epoch [44/50] batch [2000/2000] time 2.063 (2.149) data 0.000 (0.001) loss 2.3263 (1.1395) lr 2.2949e-04 eta 7:09:46
epoch [45/50] batch [20/2000] time 2.066 (2.083) data 0.000 (0.034) loss 0.1405 (0.9302) lr 2.2949e-04 eta 6:55:56
epoch [45/50] batch [40/2000] time 2.069 (2.066) data 0.000 (0.017) loss 0.3473 (1.0882) lr 2.2949e-04 eta 6:51:53
epoch [45/50] batch [60/2000] time 2.069 (2.059) data 0.001 (0.012) loss 0.8235 (1.1366) lr 2.2949e-04 eta 6:49:47
epoch [45/50] batch [80/2000] time 2.039 (2.054) data 0.000 (0.009) loss 0.8690 (1.1438) lr 2.2949e-04 eta 6:48:06
epoch [45/50] batch [100/2000] time 2.063 (2.053) data 0.000 (0.007) loss 1.3180 (1.1541) lr 2.2949e-04 eta 6:47:08
epoch [45/50] batch [120/2000] time 2.074 (2.053) data 0.000 (0.006) loss 0.7800 (1.2040) lr 2.2949e-04 eta 6:46:28
epoch [45/50] batch [140/2000] time 2.068 (2.051) data 0.000 (0.005) loss 0.5223 (1.2233) lr 2.2949e-04 eta 6:45:23
epoch [45/50] batch [160/2000] time 2.066 (2.050) data 0.000 (0.005) loss 0.9231 (1.1803) lr 2.2949e-04 eta 6:44:33
epoch [45/50] batch [180/2000] time 2.068 (2.050) data 0.000 (0.004) loss 0.5012 (1.1827) lr 2.2949e-04 eta 6:43:49
epoch [45/50] batch [200/2000] time 2.025 (2.049) data 0.000 (0.004) loss 3.0169 (1.1931) lr 2.2949e-04 eta 6:43:02
epoch [45/50] batch [220/2000] time 2.047 (2.049) data 0.000 (0.003) loss 0.3925 (1.1921) lr 2.2949e-04 eta 6:42:22
epoch [45/50] batch [240/2000] time 2.062 (2.049) data 0.000 (0.003) loss 0.1653 (1.1969) lr 2.2949e-04 eta 6:41:40
epoch [45/50] batch [260/2000] time 2.042 (2.050) data 0.000 (0.003) loss 4.3202 (1.2340) lr 2.2949e-04 eta 6:41:01
epoch [45/50] batch [280/2000] time 2.068 (2.049) data 0.000 (0.003) loss 0.7332 (1.2409) lr 2.2949e-04 eta 6:40:19
epoch [45/50] batch [300/2000] time 2.043 (2.049) data 0.000 (0.003) loss 1.2164 (1.2328) lr 2.2949e-04 eta 6:39:33
epoch [45/50] batch [320/2000] time 2.043 (2.049) data 0.000 (0.002) loss 2.8752 (1.2269) lr 2.2949e-04 eta 6:38:51
epoch [45/50] batch [340/2000] time 2.043 (2.049) data 0.000 (0.002) loss 1.8828 (1.2290) lr 2.2949e-04 eta 6:38:13
epoch [45/50] batch [360/2000] time 2.074 (2.048) data 0.000 (0.002) loss 1.1386 (1.2198) lr 2.2949e-04 eta 6:37:23
epoch [45/50] batch [380/2000] time 2.066 (2.048) data 0.000 (0.002) loss 2.8525 (1.2157) lr 2.2949e-04 eta 6:36:42
epoch [45/50] batch [400/2000] time 1.984 (2.048) data 0.000 (0.002) loss 2.6479 (1.2244) lr 2.2949e-04 eta 6:36:00
epoch [45/50] batch [420/2000] time 2.010 (2.048) data 0.000 (0.002) loss 1.7605 (1.2228) lr 2.2949e-04 eta 6:35:17
epoch [45/50] batch [440/2000] time 2.011 (2.048) data 0.000 (0.002) loss 0.1287 (1.2159) lr 2.2949e-04 eta 6:34:32
epoch [45/50] batch [460/2000] time 2.011 (2.048) data 0.000 (0.002) loss 1.3511 (1.2139) lr 2.2949e-04 eta 6:33:50
epoch [45/50] batch [480/2000] time 2.048 (2.047) data 0.000 (0.002) loss 2.8025 (1.2301) lr 2.2949e-04 eta 6:33:04
epoch [45/50] batch [500/2000] time 2.166 (2.056) data 0.000 (0.002) loss 0.5724 (1.2244) lr 2.2949e-04 eta 6:33:58
epoch [45/50] batch [520/2000] time 2.591 (2.065) data 0.000 (0.002) loss 3.5857 (1.2135) lr 2.2949e-04 eta 6:35:04
epoch [45/50] batch [540/2000] time 2.130 (2.073) data 0.000 (0.002) loss 0.3380 (1.2228) lr 2.2949e-04 eta 6:36:00
epoch [45/50] batch [560/2000] time 2.481 (2.082) data 0.000 (0.002) loss 1.5050 (1.2179) lr 2.2949e-04 eta 6:36:53
epoch [45/50] batch [580/2000] time 2.146 (2.089) data 0.001 (0.002) loss 4.0025 (1.2196) lr 2.2949e-04 eta 6:37:34
epoch [45/50] batch [600/2000] time 2.232 (2.097) data 0.001 (0.002) loss 0.8588 (1.2082) lr 2.2949e-04 eta 6:38:22
epoch [45/50] batch [620/2000] time 2.518 (2.103) data 0.000 (0.002) loss 2.7491 (1.2129) lr 2.2949e-04 eta 6:38:57
epoch [45/50] batch [640/2000] time 2.327 (2.109) data 0.000 (0.002) loss 0.1577 (1.2126) lr 2.2949e-04 eta 6:39:21
epoch [45/50] batch [660/2000] time 2.133 (2.115) data 0.000 (0.001) loss 0.3816 (1.1961) lr 2.2949e-04 eta 6:39:45
epoch [45/50] batch [680/2000] time 2.560 (2.121) data 0.000 (0.001) loss 3.6232 (1.1882) lr 2.2949e-04 eta 6:40:06
epoch [45/50] batch [700/2000] time 2.134 (2.125) data 0.000 (0.001) loss 1.8056 (1.1929) lr 2.2949e-04 eta 6:40:11
epoch [45/50] batch [720/2000] time 2.186 (2.130) data 0.001 (0.001) loss 0.7584 (1.1852) lr 2.2949e-04 eta 6:40:30
epoch [45/50] batch [740/2000] time 2.434 (2.135) data 0.000 (0.001) loss 1.3609 (1.1851) lr 2.2949e-04 eta 6:40:37
epoch [45/50] batch [760/2000] time 2.199 (2.139) data 0.000 (0.001) loss 1.6565 (1.1835) lr 2.2949e-04 eta 6:40:40
epoch [45/50] batch [780/2000] time 2.006 (2.137) data 0.000 (0.001) loss 1.1399 (1.1787) lr 2.2949e-04 eta 6:39:35
epoch [45/50] batch [800/2000] time 2.062 (2.134) data 0.000 (0.001) loss 1.0792 (1.1839) lr 2.2949e-04 eta 6:38:25
epoch [45/50] batch [820/2000] time 2.058 (2.132) data 0.000 (0.001) loss 0.5208 (1.1816) lr 2.2949e-04 eta 6:37:17
epoch [45/50] batch [840/2000] time 2.037 (2.130) data 0.001 (0.001) loss 1.1137 (1.1793) lr 2.2949e-04 eta 6:36:09
epoch [45/50] batch [860/2000] time 2.009 (2.128) data 0.000 (0.001) loss 0.8529 (1.1752) lr 2.2949e-04 eta 6:35:04
epoch [45/50] batch [880/2000] time 2.064 (2.126) data 0.000 (0.001) loss 1.0219 (1.1644) lr 2.2949e-04 eta 6:34:00
epoch [45/50] batch [900/2000] time 2.039 (2.124) data 0.000 (0.001) loss 4.1241 (1.1586) lr 2.2949e-04 eta 6:32:54
epoch [45/50] batch [920/2000] time 2.063 (2.122) data 0.000 (0.001) loss 1.0532 (1.1592) lr 2.2949e-04 eta 6:31:49
epoch [45/50] batch [940/2000] time 2.057 (2.120) data 0.000 (0.001) loss 6.0140 (1.1576) lr 2.2949e-04 eta 6:30:48
epoch [45/50] batch [960/2000] time 2.056 (2.119) data 0.000 (0.001) loss 1.8182 (1.1583) lr 2.2949e-04 eta 6:29:48
epoch [45/50] batch [980/2000] time 2.036 (2.117) data 0.000 (0.001) loss 1.1765 (1.1550) lr 2.2949e-04 eta 6:28:48
epoch [45/50] batch [1000/2000] time 2.006 (2.115) data 0.000 (0.001) loss 1.7246 (1.1512) lr 2.2949e-04 eta 6:27:48
epoch [45/50] batch [1020/2000] time 2.008 (2.114) data 0.000 (0.001) loss 1.4066 (1.1525) lr 2.2949e-04 eta 6:26:51
epoch [45/50] batch [1040/2000] time 2.011 (2.113) data 0.000 (0.001) loss 0.8556 (1.1646) lr 2.2949e-04 eta 6:25:53
epoch [45/50] batch [1060/2000] time 2.007 (2.111) data 0.000 (0.001) loss 1.3776 (1.1674) lr 2.2949e-04 eta 6:24:55
epoch [45/50] batch [1080/2000] time 2.034 (2.110) data 0.000 (0.001) loss 0.7295 (1.1708) lr 2.2949e-04 eta 6:23:57
epoch [45/50] batch [1100/2000] time 2.007 (2.108) data 0.001 (0.001) loss 2.8580 (1.1713) lr 2.2949e-04 eta 6:23:01
epoch [45/50] batch [1120/2000] time 2.061 (2.107) data 0.000 (0.001) loss 0.8938 (1.1740) lr 2.2949e-04 eta 6:22:05
epoch [45/50] batch [1140/2000] time 2.066 (2.106) data 0.001 (0.001) loss 1.4552 (1.1807) lr 2.2949e-04 eta 6:21:10
epoch [45/50] batch [1160/2000] time 2.006 (2.105) data 0.000 (0.001) loss 0.2715 (1.1771) lr 2.2949e-04 eta 6:20:16
epoch [45/50] batch [1180/2000] time 2.041 (2.104) data 0.000 (0.001) loss 0.4417 (1.1721) lr 2.2949e-04 eta 6:19:22
epoch [45/50] batch [1200/2000] time 2.185 (2.105) data 0.000 (0.001) loss 0.6188 (1.1700) lr 2.2949e-04 eta 6:18:55
epoch [45/50] batch [1220/2000] time 2.213 (2.109) data 0.001 (0.001) loss 1.1355 (1.1740) lr 2.2949e-04 eta 6:18:52
epoch [45/50] batch [1240/2000] time 2.528 (2.112) data 0.000 (0.001) loss 2.3667 (1.1694) lr 2.2949e-04 eta 6:18:44
epoch [45/50] batch [1260/2000] time 2.162 (2.115) data 0.000 (0.001) loss 0.2912 (1.1674) lr 2.2949e-04 eta 6:18:33
epoch [45/50] batch [1280/2000] time 2.124 (2.118) data 0.000 (0.001) loss 0.4133 (1.1654) lr 2.2949e-04 eta 6:18:24
epoch [45/50] batch [1300/2000] time 2.492 (2.121) data 0.000 (0.001) loss 0.4777 (1.1630) lr 2.2949e-04 eta 6:18:14
epoch [45/50] batch [1320/2000] time 2.342 (2.123) data 0.000 (0.001) loss 0.5494 (1.1636) lr 2.2949e-04 eta 6:17:58
epoch [45/50] batch [1340/2000] time 2.195 (2.126) data 0.000 (0.001) loss 1.8475 (1.1606) lr 2.2949e-04 eta 6:17:44
epoch [45/50] batch [1360/2000] time 2.165 (2.129) data 0.000 (0.001) loss 0.5923 (1.1605) lr 2.2949e-04 eta 6:17:29
epoch [45/50] batch [1380/2000] time 2.516 (2.131) data 0.000 (0.001) loss 1.1329 (1.1606) lr 2.2949e-04 eta 6:17:11
epoch [45/50] batch [1400/2000] time 2.147 (2.133) data 0.000 (0.001) loss 1.7241 (1.1620) lr 2.2949e-04 eta 6:16:51
epoch [45/50] batch [1420/2000] time 2.261 (2.136) data 0.000 (0.001) loss 0.5293 (1.1561) lr 2.2949e-04 eta 6:16:34
epoch [45/50] batch [1440/2000] time 2.325 (2.138) data 0.000 (0.001) loss 1.0390 (1.1557) lr 2.2949e-04 eta 6:16:14
epoch [45/50] batch [1460/2000] time 2.149 (2.140) data 0.000 (0.001) loss 3.0145 (1.1555) lr 2.2949e-04 eta 6:15:54
epoch [45/50] batch [1480/2000] time 2.054 (2.139) data 0.000 (0.001) loss 4.5824 (1.1566) lr 2.2949e-04 eta 6:14:59
epoch [45/50] batch [1500/2000] time 2.002 (2.137) data 0.000 (0.001) loss 0.1149 (1.1608) lr 2.2949e-04 eta 6:14:01
epoch [45/50] batch [1520/2000] time 2.054 (2.136) data 0.000 (0.001) loss 3.3911 (1.1592) lr 2.2949e-04 eta 6:13:04
epoch [45/50] batch [1540/2000] time 2.057 (2.135) data 0.000 (0.001) loss 2.4129 (1.1586) lr 2.2949e-04 eta 6:12:07
epoch [45/50] batch [1560/2000] time 2.056 (2.133) data 0.000 (0.001) loss 0.2665 (1.1574) lr 2.2949e-04 eta 6:11:11
epoch [45/50] batch [1580/2000] time 2.055 (2.132) data 0.000 (0.001) loss 2.6593 (1.1566) lr 2.2949e-04 eta 6:10:15
epoch [45/50] batch [1600/2000] time 2.002 (2.131) data 0.000 (0.001) loss 0.8778 (1.1521) lr 2.2949e-04 eta 6:09:18
epoch [45/50] batch [1620/2000] time 2.001 (2.129) data 0.000 (0.001) loss 0.4101 (1.1482) lr 2.2949e-04 eta 6:08:23
epoch [45/50] batch [1640/2000] time 2.059 (2.128) data 0.000 (0.001) loss 0.9189 (1.1479) lr 2.2949e-04 eta 6:07:29
epoch [45/50] batch [1660/2000] time 1.984 (2.127) data 0.000 (0.001) loss 2.5160 (1.1458) lr 2.2949e-04 eta 6:06:34
epoch [45/50] batch [1680/2000] time 2.052 (2.126) data 0.001 (0.001) loss 1.5885 (1.1459) lr 2.2949e-04 eta 6:05:40
epoch [45/50] batch [1700/2000] time 2.051 (2.125) data 0.000 (0.001) loss 0.6721 (1.1420) lr 2.2949e-04 eta 6:04:45
epoch [45/50] batch [1720/2000] time 2.060 (2.124) data 0.000 (0.001) loss 1.2107 (1.1397) lr 2.2949e-04 eta 6:03:52
epoch [45/50] batch [1740/2000] time 2.061 (2.123) data 0.000 (0.001) loss 0.2074 (1.1396) lr 2.2949e-04 eta 6:03:01
epoch [45/50] batch [1760/2000] time 2.058 (2.122) data 0.000 (0.001) loss 0.6929 (1.1358) lr 2.2949e-04 eta 6:02:09
epoch [45/50] batch [1780/2000] time 2.063 (2.121) data 0.000 (0.001) loss 0.4515 (1.1350) lr 2.2949e-04 eta 6:01:17
epoch [45/50] batch [1800/2000] time 2.002 (2.120) data 0.000 (0.001) loss 0.7697 (1.1365) lr 2.2949e-04 eta 6:00:25
epoch [45/50] batch [1820/2000] time 1.999 (2.119) data 0.000 (0.001) loss 1.0804 (1.1373) lr 2.2949e-04 eta 5:59:32
epoch [45/50] batch [1840/2000] time 2.037 (2.118) data 0.000 (0.001) loss 0.0853 (1.1368) lr 2.2949e-04 eta 5:58:39
epoch [45/50] batch [1860/2000] time 2.056 (2.117) data 0.000 (0.001) loss 0.1689 (1.1360) lr 2.2949e-04 eta 5:57:48
epoch [45/50] batch [1880/2000] time 2.058 (2.116) data 0.000 (0.001) loss 0.9186 (1.1367) lr 2.2949e-04 eta 5:56:56
epoch [45/50] batch [1900/2000] time 2.001 (2.115) data 0.000 (0.001) loss 0.6162 (1.1344) lr 2.2949e-04 eta 5:56:05
epoch [45/50] batch [1920/2000] time 2.007 (2.114) data 0.000 (0.001) loss 0.5075 (1.1340) lr 2.2949e-04 eta 5:55:13
epoch [45/50] batch [1940/2000] time 1.975 (2.114) data 0.000 (0.001) loss 0.7092 (1.1353) lr 2.2949e-04 eta 5:54:22
epoch [45/50] batch [1960/2000] time 2.058 (2.113) data 0.000 (0.001) loss 0.2082 (1.1366) lr 2.2949e-04 eta 5:53:31
epoch [45/50] batch [1980/2000] time 2.058 (2.112) data 0.000 (0.001) loss 0.6296 (1.1382) lr 2.2949e-04 eta 5:52:41
epoch [45/50] batch [2000/2000] time 2.033 (2.111) data 0.000 (0.001) loss 0.4760 (1.1390) lr 1.9098e-04 eta 5:51:50
epoch [46/50] batch [20/2000] time 2.060 (2.076) data 0.000 (0.034) loss 0.1894 (0.8413) lr 1.9098e-04 eta 5:45:15
epoch [46/50] batch [40/2000] time 2.001 (2.052) data 0.000 (0.017) loss 0.3097 (1.1220) lr 1.9098e-04 eta 5:40:34
epoch [46/50] batch [60/2000] time 2.054 (2.047) data 0.001 (0.012) loss 0.7616 (1.0912) lr 1.9098e-04 eta 5:39:11
epoch [46/50] batch [80/2000] time 2.055 (2.043) data 0.000 (0.009) loss 2.0974 (1.1528) lr 1.9098e-04 eta 5:37:47
epoch [46/50] batch [100/2000] time 2.034 (2.041) data 0.000 (0.007) loss 0.6605 (1.1125) lr 1.9098e-04 eta 5:36:45
epoch [46/50] batch [120/2000] time 2.002 (2.039) data 0.000 (0.006) loss 1.5276 (1.0768) lr 1.9098e-04 eta 5:35:47
epoch [46/50] batch [140/2000] time 2.056 (2.040) data 0.000 (0.005) loss 0.3174 (1.0669) lr 1.9098e-04 eta 5:35:13
epoch [46/50] batch [160/2000] time 2.053 (2.039) data 0.000 (0.004) loss 1.5391 (1.1125) lr 1.9098e-04 eta 5:34:24
epoch [46/50] batch [180/2000] time 2.002 (2.038) data 0.000 (0.004) loss 0.5843 (1.1308) lr 1.9098e-04 eta 5:33:28
epoch [46/50] batch [200/2000] time 1.982 (2.037) data 0.000 (0.004) loss 1.1384 (1.1045) lr 1.9098e-04 eta 5:32:40
epoch [46/50] batch [220/2000] time 2.060 (2.037) data 0.000 (0.003) loss 0.7279 (1.1327) lr 1.9098e-04 eta 5:31:57
epoch [46/50] batch [240/2000] time 2.029 (2.037) data 0.000 (0.003) loss 0.4020 (1.1102) lr 1.9098e-04 eta 5:31:21
epoch [46/50] batch [260/2000] time 2.029 (2.037) data 0.000 (0.003) loss 0.4919 (1.1037) lr 1.9098e-04 eta 5:30:38
epoch [46/50] batch [280/2000] time 2.002 (2.036) data 0.000 (0.003) loss 0.1831 (1.0843) lr 1.9098e-04 eta 5:29:54
epoch [46/50] batch [300/2000] time 1.977 (2.036) data 0.000 (0.003) loss 0.2169 (1.0937) lr 1.9098e-04 eta 5:29:08
epoch [46/50] batch [320/2000] time 2.000 (2.035) data 0.000 (0.002) loss 1.5890 (1.1227) lr 1.9098e-04 eta 5:28:22
epoch [46/50] batch [340/2000] time 2.026 (2.035) data 0.000 (0.002) loss 0.5680 (1.1493) lr 1.9098e-04 eta 5:27:40
epoch [46/50] batch [360/2000] time 2.053 (2.035) data 0.000 (0.002) loss 0.3681 (1.1502) lr 1.9098e-04 eta 5:27:00
epoch [46/50] batch [380/2000] time 2.052 (2.035) data 0.000 (0.002) loss 1.0233 (1.1527) lr 1.9098e-04 eta 5:26:14
epoch [46/50] batch [400/2000] time 2.005 (2.035) data 0.000 (0.002) loss 2.0309 (1.1458) lr 1.9098e-04 eta 5:25:35
epoch [46/50] batch [420/2000] time 2.057 (2.035) data 0.000 (0.002) loss 0.2394 (1.1588) lr 1.9098e-04 eta 5:24:55
epoch [46/50] batch [440/2000] time 2.000 (2.035) data 0.000 (0.002) loss 0.4956 (1.1632) lr 1.9098e-04 eta 5:24:15
epoch [46/50] batch [460/2000] time 2.050 (2.035) data 0.000 (0.002) loss 1.0352 (1.1537) lr 1.9098e-04 eta 5:23:31
epoch [46/50] batch [480/2000] time 2.051 (2.034) data 0.000 (0.002) loss 0.1915 (1.1532) lr 1.9098e-04 eta 5:22:47
epoch [46/50] batch [500/2000] time 2.002 (2.034) data 0.000 (0.002) loss 0.3120 (1.1472) lr 1.9098e-04 eta 5:22:03
epoch [46/50] batch [520/2000] time 2.034 (2.034) data 0.000 (0.002) loss 0.5092 (1.1405) lr 1.9098e-04 eta 5:21:20
epoch [46/50] batch [540/2000] time 1.981 (2.034) data 0.000 (0.001) loss 1.2149 (1.1330) lr 1.9098e-04 eta 5:20:42
epoch [46/50] batch [560/2000] time 2.007 (2.034) data 0.000 (0.001) loss 0.6151 (1.1235) lr 1.9098e-04 eta 5:20:01
epoch [46/50] batch [580/2000] time 2.034 (2.034) data 0.000 (0.001) loss 2.3949 (1.1255) lr 1.9098e-04 eta 5:19:22
epoch [46/50] batch [600/2000] time 2.001 (2.034) data 0.001 (0.001) loss 2.4950 (1.1266) lr 1.9098e-04 eta 5:18:40
epoch [46/50] batch [620/2000] time 2.056 (2.034) data 0.000 (0.001) loss 0.9805 (1.1206) lr 1.9098e-04 eta 5:17:59
epoch [46/50] batch [640/2000] time 2.057 (2.034) data 0.000 (0.001) loss 1.1153 (1.1117) lr 1.9098e-04 eta 5:17:19
epoch [46/50] batch [660/2000] time 2.029 (2.034) data 0.000 (0.001) loss 1.2752 (1.1012) lr 1.9098e-04 eta 5:16:36
epoch [46/50] batch [680/2000] time 2.004 (2.034) data 0.000 (0.001) loss 0.3368 (1.1073) lr 1.9098e-04 eta 5:15:56
epoch [46/50] batch [700/2000] time 2.052 (2.034) data 0.000 (0.001) loss 2.1323 (1.1086) lr 1.9098e-04 eta 5:15:15
epoch [46/50] batch [720/2000] time 2.007 (2.034) data 0.000 (0.001) loss 0.6440 (1.1155) lr 1.9098e-04 eta 5:14:32
epoch [46/50] batch [740/2000] time 2.061 (2.034) data 0.000 (0.001) loss 0.7465 (1.1131) lr 1.9098e-04 eta 5:13:53
epoch [46/50] batch [760/2000] time 2.057 (2.034) data 0.000 (0.001) loss 0.5555 (1.1114) lr 1.9098e-04 eta 5:13:13
epoch [46/50] batch [780/2000] time 2.033 (2.034) data 0.000 (0.001) loss 1.3254 (1.1128) lr 1.9098e-04 eta 5:12:31
epoch [46/50] batch [800/2000] time 2.056 (2.034) data 0.000 (0.001) loss 0.5087 (1.1209) lr 1.9098e-04 eta 5:11:52
epoch [46/50] batch [820/2000] time 2.056 (2.034) data 0.000 (0.001) loss 0.2598 (1.1208) lr 1.9098e-04 eta 5:11:11
epoch [46/50] batch [840/2000] time 2.036 (2.034) data 0.000 (0.001) loss 0.6821 (1.1167) lr 1.9098e-04 eta 5:10:31
epoch [46/50] batch [860/2000] time 2.000 (2.034) data 0.000 (0.001) loss 0.0459 (1.1176) lr 1.9098e-04 eta 5:09:51
epoch [46/50] batch [880/2000] time 2.062 (2.034) data 0.000 (0.001) loss 3.5220 (1.1273) lr 1.9098e-04 eta 5:09:09
epoch [46/50] batch [900/2000] time 2.061 (2.034) data 0.000 (0.001) loss 0.2399 (1.1236) lr 1.9098e-04 eta 5:08:29
epoch [46/50] batch [920/2000] time 2.001 (2.034) data 0.000 (0.001) loss 0.6769 (1.1202) lr 1.9098e-04 eta 5:07:47
epoch [46/50] batch [940/2000] time 2.040 (2.034) data 0.000 (0.001) loss 1.2573 (1.1236) lr 1.9098e-04 eta 5:07:07
epoch [46/50] batch [960/2000] time 2.008 (2.034) data 0.000 (0.001) loss 0.9180 (1.1280) lr 1.9098e-04 eta 5:06:26
epoch [46/50] batch [980/2000] time 2.064 (2.034) data 0.000 (0.001) loss 0.2683 (1.1240) lr 1.9098e-04 eta 5:05:48
epoch [46/50] batch [1000/2000] time 2.038 (2.034) data 0.000 (0.001) loss 0.7501 (1.1260) lr 1.9098e-04 eta 5:05:08
epoch [46/50] batch [1020/2000] time 2.041 (2.034) data 0.000 (0.001) loss 2.1242 (1.1230) lr 1.9098e-04 eta 5:04:28
epoch [46/50] batch [1040/2000] time 2.004 (2.034) data 0.000 (0.001) loss 1.4145 (1.1298) lr 1.9098e-04 eta 5:03:48
epoch [46/50] batch [1060/2000] time 2.059 (2.034) data 0.000 (0.001) loss 2.3829 (1.1346) lr 1.9098e-04 eta 5:03:08
epoch [46/50] batch [1080/2000] time 2.061 (2.034) data 0.000 (0.001) loss 0.7680 (1.1379) lr 1.9098e-04 eta 5:02:27
epoch [46/50] batch [1100/2000] time 1.977 (2.034) data 0.000 (0.001) loss 2.2274 (1.1410) lr 1.9098e-04 eta 5:01:46
epoch [46/50] batch [1120/2000] time 2.005 (2.035) data 0.000 (0.001) loss 2.2088 (1.1480) lr 1.9098e-04 eta 5:01:06
epoch [46/50] batch [1140/2000] time 2.004 (2.034) data 0.001 (0.001) loss 0.7215 (1.1416) lr 1.9098e-04 eta 5:00:25
epoch [46/50] batch [1160/2000] time 1.975 (2.034) data 0.000 (0.001) loss 1.3743 (1.1411) lr 1.9098e-04 eta 4:59:42
epoch [46/50] batch [1180/2000] time 2.055 (2.034) data 0.000 (0.001) loss 1.6255 (1.1400) lr 1.9098e-04 eta 4:59:00
epoch [46/50] batch [1200/2000] time 2.032 (2.034) data 0.000 (0.001) loss 1.6042 (1.1352) lr 1.9098e-04 eta 4:58:19
epoch [46/50] batch [1220/2000] time 2.056 (2.034) data 0.000 (0.001) loss 2.2272 (1.1358) lr 1.9098e-04 eta 4:57:39
epoch [46/50] batch [1240/2000] time 2.057 (2.034) data 0.000 (0.001) loss 0.1338 (1.1375) lr 1.9098e-04 eta 4:56:58
epoch [46/50] batch [1260/2000] time 1.997 (2.034) data 0.000 (0.001) loss 0.9289 (1.1339) lr 1.9098e-04 eta 4:56:17
epoch [46/50] batch [1280/2000] time 2.056 (2.034) data 0.000 (0.001) loss 0.7365 (1.1329) lr 1.9098e-04 eta 4:55:36
epoch [46/50] batch [1300/2000] time 2.055 (2.034) data 0.000 (0.001) loss 1.4280 (1.1336) lr 1.9098e-04 eta 4:54:56
epoch [46/50] batch [1320/2000] time 2.053 (2.034) data 0.000 (0.001) loss 1.7672 (1.1342) lr 1.9098e-04 eta 4:54:15
epoch [46/50] batch [1340/2000] time 2.062 (2.034) data 0.000 (0.001) loss 1.9738 (1.1341) lr 1.9098e-04 eta 4:53:35
epoch [46/50] batch [1360/2000] time 2.038 (2.034) data 0.000 (0.001) loss 0.7942 (1.1360) lr 1.9098e-04 eta 4:52:56
epoch [46/50] batch [1380/2000] time 2.059 (2.034) data 0.000 (0.001) loss 1.7169 (1.1400) lr 1.9098e-04 eta 4:52:15
epoch [46/50] batch [1400/2000] time 2.003 (2.034) data 0.000 (0.001) loss 0.5668 (1.1391) lr 1.9098e-04 eta 4:51:34
epoch [46/50] batch [1420/2000] time 2.039 (2.034) data 0.000 (0.001) loss 0.5528 (1.1410) lr 1.9098e-04 eta 4:50:54
epoch [46/50] batch [1440/2000] time 2.009 (2.034) data 0.000 (0.001) loss 2.5966 (1.1434) lr 1.9098e-04 eta 4:50:14
epoch [46/50] batch [1460/2000] time 1.999 (2.034) data 0.000 (0.001) loss 1.1739 (1.1412) lr 1.9098e-04 eta 4:49:34
epoch [46/50] batch [1480/2000] time 1.999 (2.034) data 0.000 (0.001) loss 2.3293 (1.1442) lr 1.9098e-04 eta 4:48:53
epoch [46/50] batch [1500/2000] time 2.007 (2.034) data 0.000 (0.001) loss 2.0260 (1.1420) lr 1.9098e-04 eta 4:48:12
epoch [46/50] batch [1520/2000] time 2.062 (2.035) data 0.000 (0.001) loss 0.2787 (1.1394) lr 1.9098e-04 eta 4:47:32
epoch [46/50] batch [1540/2000] time 2.061 (2.035) data 0.000 (0.001) loss 0.6053 (1.1382) lr 1.9098e-04 eta 4:46:52
epoch [46/50] batch [1560/2000] time 2.033 (2.034) data 0.000 (0.001) loss 0.2195 (1.1359) lr 1.9098e-04 eta 4:46:10
epoch [46/50] batch [1580/2000] time 2.000 (2.034) data 0.000 (0.001) loss 3.4036 (1.1376) lr 1.9098e-04 eta 4:45:29
epoch [46/50] batch [1600/2000] time 2.060 (2.034) data 0.000 (0.001) loss 2.4057 (1.1368) lr 1.9098e-04 eta 4:44:49
epoch [46/50] batch [1620/2000] time 2.001 (2.034) data 0.000 (0.001) loss 0.3655 (1.1315) lr 1.9098e-04 eta 4:44:08
epoch [46/50] batch [1640/2000] time 2.034 (2.034) data 0.000 (0.001) loss 2.2534 (1.1375) lr 1.9098e-04 eta 4:43:27
epoch [46/50] batch [1660/2000] time 2.058 (2.035) data 0.000 (0.001) loss 2.8582 (1.1404) lr 1.9098e-04 eta 4:42:48
epoch [46/50] batch [1680/2000] time 2.003 (2.035) data 0.001 (0.001) loss 1.2785 (1.1389) lr 1.9098e-04 eta 4:42:07
epoch [46/50] batch [1700/2000] time 2.060 (2.035) data 0.000 (0.001) loss 2.6884 (1.1452) lr 1.9098e-04 eta 4:41:27
epoch [46/50] batch [1720/2000] time 2.058 (2.035) data 0.000 (0.001) loss 0.4744 (1.1493) lr 1.9098e-04 eta 4:40:46
epoch [46/50] batch [1740/2000] time 2.003 (2.035) data 0.000 (0.001) loss 1.2672 (1.1475) lr 1.9098e-04 eta 4:40:05
epoch [46/50] batch [1760/2000] time 1.974 (2.035) data 0.000 (0.001) loss 2.1343 (1.1465) lr 1.9098e-04 eta 4:39:24
epoch [46/50] batch [1780/2000] time 2.054 (2.035) data 0.000 (0.001) loss 1.0227 (1.1502) lr 1.9098e-04 eta 4:38:43
epoch [46/50] batch [1800/2000] time 2.061 (2.035) data 0.000 (0.001) loss 1.6840 (1.1502) lr 1.9098e-04 eta 4:38:03
epoch [46/50] batch [1820/2000] time 2.054 (2.035) data 0.000 (0.001) loss 0.1761 (1.1475) lr 1.9098e-04 eta 4:37:22
epoch [46/50] batch [1840/2000] time 2.035 (2.035) data 0.000 (0.001) loss 1.0547 (1.1470) lr 1.9098e-04 eta 4:36:42
epoch [46/50] batch [1860/2000] time 2.059 (2.035) data 0.000 (0.001) loss 0.1053 (1.1449) lr 1.9098e-04 eta 4:36:01
epoch [46/50] batch [1880/2000] time 2.053 (2.035) data 0.000 (0.001) loss 1.1030 (1.1427) lr 1.9098e-04 eta 4:35:20
epoch [46/50] batch [1900/2000] time 2.000 (2.035) data 0.000 (0.001) loss 0.5144 (1.1450) lr 1.9098e-04 eta 4:34:39
epoch [46/50] batch [1920/2000] time 2.002 (2.035) data 0.000 (0.001) loss 1.8975 (1.1451) lr 1.9098e-04 eta 4:33:58
epoch [46/50] batch [1940/2000] time 2.060 (2.035) data 0.000 (0.001) loss 0.4791 (1.1428) lr 1.9098e-04 eta 4:33:18
epoch [46/50] batch [1960/2000] time 2.038 (2.035) data 0.000 (0.001) loss 0.4739 (1.1420) lr 1.9098e-04 eta 4:32:37
epoch [46/50] batch [1980/2000] time 2.061 (2.035) data 0.000 (0.001) loss 0.5044 (1.1426) lr 1.9098e-04 eta 4:31:57
epoch [46/50] batch [2000/2000] time 1.999 (2.035) data 0.000 (0.001) loss 2.0689 (1.1420) lr 1.5567e-04 eta 4:31:16
epoch [47/50] batch [20/2000] time 2.008 (2.074) data 0.000 (0.034) loss 1.4366 (0.9994) lr 1.5567e-04 eta 4:35:46
epoch [47/50] batch [40/2000] time 2.037 (2.059) data 0.000 (0.017) loss 3.1441 (1.1348) lr 1.5567e-04 eta 4:33:12
epoch [47/50] batch [60/2000] time 2.062 (2.053) data 0.000 (0.012) loss 1.2039 (1.0621) lr 1.5567e-04 eta 4:31:44
epoch [47/50] batch [80/2000] time 2.005 (2.050) data 0.000 (0.009) loss 1.6999 (1.0035) lr 1.5567e-04 eta 4:30:37
epoch [47/50] batch [100/2000] time 2.063 (2.047) data 0.000 (0.007) loss 2.5772 (0.9682) lr 1.5567e-04 eta 4:29:33
epoch [47/50] batch [120/2000] time 2.040 (2.046) data 0.000 (0.006) loss 0.3851 (1.0107) lr 1.5567e-04 eta 4:28:39
epoch [47/50] batch [140/2000] time 2.060 (2.044) data 0.000 (0.005) loss 0.6820 (1.0585) lr 1.5567e-04 eta 4:27:48
epoch [47/50] batch [160/2000] time 2.006 (2.043) data 0.000 (0.005) loss 0.8161 (1.0179) lr 1.5567e-04 eta 4:26:59
epoch [47/50] batch [180/2000] time 2.036 (2.043) data 0.000 (0.004) loss 0.6095 (1.0319) lr 1.5567e-04 eta 4:26:14
epoch [47/50] batch [200/2000] time 2.062 (2.042) data 0.000 (0.004) loss 2.1801 (1.0840) lr 1.5567e-04 eta 4:25:28
epoch [47/50] batch [220/2000] time 2.037 (2.042) data 0.000 (0.003) loss 1.2588 (1.0962) lr 1.5567e-04 eta 4:24:44
epoch [47/50] batch [240/2000] time 2.061 (2.041) data 0.000 (0.003) loss 0.0642 (1.0879) lr 1.5567e-04 eta 4:24:00
epoch [47/50] batch [260/2000] time 2.062 (2.042) data 0.000 (0.003) loss 0.6560 (1.1206) lr 1.5567e-04 eta 4:23:21
epoch [47/50] batch [280/2000] time 2.035 (2.041) data 0.000 (0.003) loss 0.7153 (1.1469) lr 1.5567e-04 eta 4:22:37
epoch [47/50] batch [300/2000] time 2.032 (2.041) data 0.000 (0.003) loss 1.0074 (1.1726) lr 1.5567e-04 eta 4:21:52
epoch [47/50] batch [320/2000] time 2.068 (2.040) data 0.000 (0.002) loss 0.9792 (1.1636) lr 1.5567e-04 eta 4:21:09
epoch [47/50] batch [340/2000] time 2.059 (2.040) data 0.000 (0.002) loss 1.1579 (1.1636) lr 1.5567e-04 eta 4:20:28
epoch [47/50] batch [360/2000] time 2.057 (2.040) data 0.000 (0.002) loss 1.5870 (1.1804) lr 1.5567e-04 eta 4:19:45
epoch [47/50] batch [380/2000] time 2.055 (2.040) data 0.000 (0.002) loss 1.7656 (1.1893) lr 1.5567e-04 eta 4:19:01
epoch [47/50] batch [400/2000] time 2.002 (2.039) data 0.000 (0.002) loss 2.1249 (1.1807) lr 1.5567e-04 eta 4:18:17
epoch [47/50] batch [420/2000] time 2.034 (2.039) data 0.000 (0.002) loss 1.1229 (1.1908) lr 1.5567e-04 eta 4:17:35
epoch [47/50] batch [440/2000] time 1.999 (2.039) data 0.000 (0.002) loss 1.2587 (1.1937) lr 1.5567e-04 eta 4:16:52
epoch [47/50] batch [460/2000] time 2.058 (2.039) data 0.000 (0.002) loss 0.8889 (1.1900) lr 1.5567e-04 eta 4:16:12
epoch [47/50] batch [480/2000] time 2.002 (2.039) data 0.000 (0.002) loss 1.1787 (1.1815) lr 1.5567e-04 eta 4:15:30
epoch [47/50] batch [500/2000] time 2.055 (2.038) data 0.000 (0.002) loss 2.0301 (1.1791) lr 1.5567e-04 eta 4:14:47
epoch [47/50] batch [520/2000] time 2.057 (2.038) data 0.000 (0.002) loss 2.8615 (1.1809) lr 1.5567e-04 eta 4:14:06
epoch [47/50] batch [540/2000] time 2.054 (2.038) data 0.000 (0.002) loss 0.0455 (1.1776) lr 1.5567e-04 eta 4:13:24
epoch [47/50] batch [560/2000] time 2.061 (2.038) data 0.000 (0.001) loss 0.0712 (1.1782) lr 1.5567e-04 eta 4:12:42
epoch [47/50] batch [580/2000] time 2.058 (2.038) data 0.000 (0.001) loss 0.8041 (1.1691) lr 1.5567e-04 eta 4:11:59
epoch [47/50] batch [600/2000] time 2.034 (2.038) data 0.000 (0.001) loss 0.0237 (1.1651) lr 1.5567e-04 eta 4:11:19
epoch [47/50] batch [620/2000] time 2.057 (2.037) data 0.000 (0.001) loss 0.4372 (1.1572) lr 1.5567e-04 eta 4:10:36
epoch [47/50] batch [640/2000] time 2.036 (2.038) data 0.000 (0.001) loss 2.0757 (1.1503) lr 1.5567e-04 eta 4:09:56
epoch [47/50] batch [660/2000] time 2.055 (2.038) data 0.000 (0.001) loss 0.1479 (1.1481) lr 1.5567e-04 eta 4:09:16
epoch [47/50] batch [680/2000] time 1.986 (2.038) data 0.000 (0.001) loss 0.1053 (1.1363) lr 1.5567e-04 eta 4:08:36
epoch [47/50] batch [700/2000] time 2.031 (2.038) data 0.000 (0.001) loss 0.8245 (1.1389) lr 1.5567e-04 eta 4:07:54
epoch [47/50] batch [720/2000] time 2.058 (2.038) data 0.000 (0.001) loss 2.5440 (1.1343) lr 1.5567e-04 eta 4:07:14
epoch [47/50] batch [740/2000] time 2.032 (2.038) data 0.000 (0.001) loss 1.1295 (1.1312) lr 1.5567e-04 eta 4:06:33
epoch [47/50] batch [760/2000] time 2.052 (2.037) data 0.000 (0.001) loss 0.7057 (1.1329) lr 1.5567e-04 eta 4:05:51
epoch [47/50] batch [780/2000] time 2.056 (2.037) data 0.000 (0.001) loss 0.0299 (1.1258) lr 1.5567e-04 eta 4:05:09
epoch [47/50] batch [800/2000] time 2.057 (2.037) data 0.000 (0.001) loss 1.7096 (1.1228) lr 1.5567e-04 eta 4:04:27
epoch [47/50] batch [820/2000] time 2.052 (2.037) data 0.000 (0.001) loss 1.3226 (1.1329) lr 1.5567e-04 eta 4:03:46
epoch [47/50] batch [840/2000] time 2.059 (2.037) data 0.000 (0.001) loss 0.8902 (1.1373) lr 1.5567e-04 eta 4:03:05
epoch [47/50] batch [860/2000] time 2.006 (2.037) data 0.000 (0.001) loss 2.7709 (1.1335) lr 1.5567e-04 eta 4:02:23
epoch [47/50] batch [880/2000] time 2.062 (2.037) data 0.000 (0.001) loss 0.0635 (1.1285) lr 1.5567e-04 eta 4:01:42
epoch [47/50] batch [900/2000] time 2.060 (2.037) data 0.000 (0.001) loss 1.9020 (1.1333) lr 1.5567e-04 eta 4:01:02
epoch [47/50] batch [920/2000] time 2.036 (2.037) data 0.000 (0.001) loss 1.6069 (1.1345) lr 1.5567e-04 eta 4:00:22
epoch [47/50] batch [940/2000] time 2.037 (2.037) data 0.000 (0.001) loss 3.1292 (1.1399) lr 1.5567e-04 eta 3:59:42
epoch [47/50] batch [960/2000] time 2.005 (2.037) data 0.000 (0.001) loss 1.6067 (1.1328) lr 1.5567e-04 eta 3:59:01
epoch [47/50] batch [980/2000] time 2.037 (2.037) data 0.000 (0.001) loss 0.9275 (1.1317) lr 1.5567e-04 eta 3:58:21
epoch [47/50] batch [1000/2000] time 2.060 (2.037) data 0.000 (0.001) loss 1.9068 (1.1354) lr 1.5567e-04 eta 3:57:39
epoch [47/50] batch [1020/2000] time 2.059 (2.037) data 0.000 (0.001) loss 0.7537 (1.1378) lr 1.5567e-04 eta 3:56:59
epoch [47/50] batch [1040/2000] time 1.997 (2.037) data 0.000 (0.001) loss 1.3342 (1.1351) lr 1.5567e-04 eta 3:56:18
epoch [47/50] batch [1060/2000] time 2.054 (2.037) data 0.000 (0.001) loss 1.7677 (1.1341) lr 1.5567e-04 eta 3:55:36
epoch [47/50] batch [1080/2000] time 2.027 (2.037) data 0.000 (0.001) loss 0.3202 (1.1303) lr 1.5567e-04 eta 3:54:55
epoch [47/50] batch [1100/2000] time 2.051 (2.037) data 0.000 (0.001) loss 1.9842 (1.1292) lr 1.5567e-04 eta 3:54:13
epoch [47/50] batch [1120/2000] time 2.031 (2.037) data 0.000 (0.001) loss 0.1123 (1.1352) lr 1.5567e-04 eta 3:53:32
epoch [47/50] batch [1140/2000] time 2.056 (2.037) data 0.001 (0.001) loss 0.0270 (1.1356) lr 1.5567e-04 eta 3:52:50
epoch [47/50] batch [1160/2000] time 2.056 (2.037) data 0.000 (0.001) loss 1.2466 (1.1338) lr 1.5567e-04 eta 3:52:10
epoch [47/50] batch [1180/2000] time 1.979 (2.036) data 0.000 (0.001) loss 0.9465 (1.1332) lr 1.5567e-04 eta 3:51:28
epoch [47/50] batch [1200/2000] time 2.061 (2.036) data 0.000 (0.001) loss 0.3114 (1.1348) lr 1.5567e-04 eta 3:50:48
epoch [47/50] batch [1220/2000] time 2.037 (2.037) data 0.000 (0.001) loss 0.0475 (1.1358) lr 1.5567e-04 eta 3:50:08
epoch [47/50] batch [1240/2000] time 2.004 (2.037) data 0.000 (0.001) loss 3.5274 (1.1354) lr 1.5567e-04 eta 3:49:27
epoch [47/50] batch [1260/2000] time 2.009 (2.037) data 0.000 (0.001) loss 1.0321 (1.1388) lr 1.5567e-04 eta 3:48:46
epoch [47/50] batch [1280/2000] time 2.062 (2.037) data 0.000 (0.001) loss 1.5254 (1.1382) lr 1.5567e-04 eta 3:48:06
epoch [47/50] batch [1300/2000] time 2.037 (2.037) data 0.000 (0.001) loss 0.8159 (1.1370) lr 1.5567e-04 eta 3:47:26
epoch [47/50] batch [1320/2000] time 2.038 (2.037) data 0.000 (0.001) loss 0.0244 (1.1330) lr 1.5567e-04 eta 3:46:45
epoch [47/50] batch [1340/2000] time 2.041 (2.037) data 0.000 (0.001) loss 2.0013 (1.1360) lr 1.5567e-04 eta 3:46:04
epoch [47/50] batch [1360/2000] time 2.044 (2.037) data 0.000 (0.001) loss 1.3550 (1.1347) lr 1.5567e-04 eta 3:45:23
epoch [47/50] batch [1380/2000] time 2.059 (2.037) data 0.000 (0.001) loss 1.0359 (1.1357) lr 1.5567e-04 eta 3:44:44
epoch [47/50] batch [1400/2000] time 2.037 (2.037) data 0.000 (0.001) loss 1.6100 (1.1337) lr 1.5567e-04 eta 3:44:03
epoch [47/50] batch [1420/2000] time 2.062 (2.037) data 0.000 (0.001) loss 1.7518 (1.1382) lr 1.5567e-04 eta 3:43:23
epoch [47/50] batch [1440/2000] time 2.038 (2.037) data 0.000 (0.001) loss 1.2005 (1.1406) lr 1.5567e-04 eta 3:42:42
epoch [47/50] batch [1460/2000] time 2.065 (2.037) data 0.000 (0.001) loss 0.2053 (1.1416) lr 1.5567e-04 eta 3:42:01
epoch [47/50] batch [1480/2000] time 2.036 (2.037) data 0.000 (0.001) loss 0.6018 (1.1429) lr 1.5567e-04 eta 3:41:21
epoch [47/50] batch [1500/2000] time 2.057 (2.037) data 0.000 (0.001) loss 1.7704 (1.1463) lr 1.5567e-04 eta 3:40:40
epoch [47/50] batch [1520/2000] time 2.057 (2.037) data 0.000 (0.001) loss 1.0436 (1.1446) lr 1.5567e-04 eta 3:39:59
epoch [47/50] batch [1540/2000] time 2.032 (2.037) data 0.000 (0.001) loss 0.3821 (1.1432) lr 1.5567e-04 eta 3:39:18
epoch [47/50] batch [1560/2000] time 2.060 (2.037) data 0.000 (0.001) loss 0.1358 (1.1421) lr 1.5567e-04 eta 3:38:38
epoch [47/50] batch [1580/2000] time 2.000 (2.037) data 0.000 (0.001) loss 0.4015 (1.1399) lr 1.5567e-04 eta 3:37:57
epoch [47/50] batch [1600/2000] time 2.060 (2.037) data 0.000 (0.001) loss 0.8462 (1.1396) lr 1.5567e-04 eta 3:37:16
epoch [47/50] batch [1620/2000] time 2.033 (2.037) data 0.000 (0.001) loss 0.0717 (1.1379) lr 1.5567e-04 eta 3:36:34
epoch [47/50] batch [1640/2000] time 2.000 (2.037) data 0.000 (0.001) loss 0.2154 (1.1362) lr 1.5567e-04 eta 3:35:53
epoch [47/50] batch [1660/2000] time 2.058 (2.037) data 0.000 (0.001) loss 0.8415 (1.1378) lr 1.5567e-04 eta 3:35:13
epoch [47/50] batch [1680/2000] time 2.060 (2.037) data 0.001 (0.001) loss 0.9472 (1.1388) lr 1.5567e-04 eta 3:34:32
epoch [47/50] batch [1700/2000] time 2.001 (2.037) data 0.000 (0.001) loss 0.5474 (1.1424) lr 1.5567e-04 eta 3:33:51
epoch [47/50] batch [1720/2000] time 2.057 (2.037) data 0.000 (0.001) loss 1.7551 (1.1401) lr 1.5567e-04 eta 3:33:10
epoch [47/50] batch [1740/2000] time 2.055 (2.037) data 0.000 (0.001) loss 0.5033 (1.1367) lr 1.5567e-04 eta 3:32:29
epoch [47/50] batch [1760/2000] time 2.033 (2.037) data 0.000 (0.001) loss 0.7249 (1.1330) lr 1.5567e-04 eta 3:31:47
epoch [47/50] batch [1780/2000] time 2.003 (2.036) data 0.000 (0.001) loss 0.4328 (1.1298) lr 1.5567e-04 eta 3:31:06
epoch [47/50] batch [1800/2000] time 2.058 (2.036) data 0.000 (0.001) loss 1.8546 (1.1307) lr 1.5567e-04 eta 3:30:26
epoch [47/50] batch [1820/2000] time 2.006 (2.036) data 0.000 (0.001) loss 0.7136 (1.1310) lr 1.5567e-04 eta 3:29:45
epoch [47/50] batch [1840/2000] time 2.056 (2.036) data 0.000 (0.001) loss 1.6670 (1.1337) lr 1.5567e-04 eta 3:29:04
epoch [47/50] batch [1860/2000] time 2.000 (2.036) data 0.000 (0.001) loss 0.2959 (1.1316) lr 1.5567e-04 eta 3:28:23
epoch [47/50] batch [1880/2000] time 2.057 (2.036) data 0.000 (0.001) loss 0.5101 (1.1301) lr 1.5567e-04 eta 3:27:41
epoch [47/50] batch [1900/2000] time 2.003 (2.036) data 0.000 (0.001) loss 1.0342 (1.1292) lr 1.5567e-04 eta 3:27:01
epoch [47/50] batch [1920/2000] time 2.057 (2.036) data 0.000 (0.001) loss 0.6898 (1.1269) lr 1.5567e-04 eta 3:26:20
epoch [47/50] batch [1940/2000] time 2.013 (2.036) data 0.000 (0.001) loss 1.3538 (1.1291) lr 1.5567e-04 eta 3:25:39
epoch [47/50] batch [1960/2000] time 2.058 (2.036) data 0.000 (0.001) loss 0.2846 (1.1277) lr 1.5567e-04 eta 3:24:59
epoch [47/50] batch [1980/2000] time 2.038 (2.036) data 0.000 (0.001) loss 0.3045 (1.1285) lr 1.5567e-04 eta 3:24:18
epoch [47/50] batch [2000/2000] time 2.035 (2.036) data 0.000 (0.001) loss 1.0841 (1.1339) lr 1.2369e-04 eta 3:23:37
epoch [48/50] batch [20/2000] time 1.974 (2.067) data 0.000 (0.035) loss 1.7948 (1.1125) lr 1.2369e-04 eta 3:25:59
epoch [48/50] batch [40/2000] time 2.062 (2.056) data 0.000 (0.017) loss 0.7697 (1.1045) lr 1.2369e-04 eta 3:24:13
epoch [48/50] batch [60/2000] time 2.006 (2.048) data 0.001 (0.012) loss 1.4415 (1.0622) lr 1.2369e-04 eta 3:22:46
epoch [48/50] batch [80/2000] time 2.032 (2.045) data 0.000 (0.009) loss 0.9038 (1.0790) lr 1.2369e-04 eta 3:21:45
epoch [48/50] batch [100/2000] time 1.976 (2.039) data 0.000 (0.007) loss 0.6162 (1.0226) lr 1.2369e-04 eta 3:20:32
epoch [48/50] batch [120/2000] time 1.998 (2.038) data 0.000 (0.006) loss 2.2078 (1.1316) lr 1.2369e-04 eta 3:19:41
epoch [48/50] batch [140/2000] time 2.038 (2.036) data 0.000 (0.005) loss 1.7440 (1.1316) lr 1.2369e-04 eta 3:18:52
epoch [48/50] batch [160/2000] time 2.003 (2.036) data 0.000 (0.005) loss 3.9650 (1.2046) lr 1.2369e-04 eta 3:18:09
epoch [48/50] batch [180/2000] time 2.064 (2.035) data 0.000 (0.004) loss 0.8289 (1.1991) lr 1.2369e-04 eta 3:17:25
epoch [48/50] batch [200/2000] time 2.002 (2.035) data 0.000 (0.004) loss 0.1078 (1.1865) lr 1.2369e-04 eta 3:16:43
epoch [48/50] batch [220/2000] time 2.059 (2.035) data 0.000 (0.003) loss 0.5257 (1.1916) lr 1.2369e-04 eta 3:16:01
epoch [48/50] batch [240/2000] time 2.033 (2.034) data 0.000 (0.003) loss 2.6339 (1.2141) lr 1.2369e-04 eta 3:15:15
epoch [48/50] batch [260/2000] time 1.976 (2.034) data 0.000 (0.003) loss 1.3574 (1.2103) lr 1.2369e-04 eta 3:14:35
epoch [48/50] batch [280/2000] time 2.058 (2.034) data 0.000 (0.003) loss 2.1873 (1.1940) lr 1.2369e-04 eta 3:13:55
epoch [48/50] batch [300/2000] time 2.058 (2.034) data 0.000 (0.003) loss 0.5164 (1.1813) lr 1.2369e-04 eta 3:13:15
epoch [48/50] batch [320/2000] time 2.054 (2.034) data 0.000 (0.002) loss 0.6533 (1.1807) lr 1.2369e-04 eta 3:12:32
epoch [48/50] batch [340/2000] time 2.051 (2.034) data 0.000 (0.002) loss 1.0816 (1.1710) lr 1.2369e-04 eta 3:11:51
epoch [48/50] batch [360/2000] time 2.003 (2.034) data 0.000 (0.002) loss 1.3852 (1.1769) lr 1.2369e-04 eta 3:11:10
epoch [48/50] batch [380/2000] time 2.033 (2.034) data 0.000 (0.002) loss 0.9969 (1.1755) lr 1.2369e-04 eta 3:10:29
epoch [48/50] batch [400/2000] time 2.057 (2.034) data 0.000 (0.002) loss 0.9592 (1.1785) lr 1.2369e-04 eta 3:09:49
epoch [48/50] batch [420/2000] time 2.063 (2.034) data 0.000 (0.002) loss 0.1835 (1.1689) lr 1.2369e-04 eta 3:09:09
epoch [48/50] batch [440/2000] time 2.062 (2.034) data 0.000 (0.002) loss 2.2285 (1.1692) lr 1.2369e-04 eta 3:08:29
epoch [48/50] batch [460/2000] time 2.036 (2.035) data 0.000 (0.002) loss 0.8424 (1.1549) lr 1.2369e-04 eta 3:07:51
epoch [48/50] batch [480/2000] time 2.060 (2.035) data 0.000 (0.002) loss 1.9003 (1.1523) lr 1.2369e-04 eta 3:07:12
epoch [48/50] batch [500/2000] time 2.036 (2.035) data 0.000 (0.002) loss 0.4605 (1.1561) lr 1.2369e-04 eta 3:06:32
epoch [48/50] batch [520/2000] time 1.997 (2.035) data 0.000 (0.002) loss 0.5481 (1.1505) lr 1.2369e-04 eta 3:05:49
epoch [48/50] batch [540/2000] time 2.056 (2.035) data 0.000 (0.002) loss 0.8170 (1.1712) lr 1.2369e-04 eta 3:05:08
epoch [48/50] batch [560/2000] time 2.000 (2.034) data 0.000 (0.001) loss 3.0413 (1.1815) lr 1.2369e-04 eta 3:04:25
epoch [48/50] batch [580/2000] time 2.054 (2.034) data 0.000 (0.001) loss 0.4708 (1.1771) lr 1.2369e-04 eta 3:03:44
epoch [48/50] batch [600/2000] time 2.032 (2.034) data 0.001 (0.001) loss 0.6229 (1.1690) lr 1.2369e-04 eta 3:03:03
epoch [48/50] batch [620/2000] time 2.039 (2.034) data 0.000 (0.001) loss 0.7344 (1.1730) lr 1.2369e-04 eta 3:02:23
epoch [48/50] batch [640/2000] time 2.070 (2.034) data 0.000 (0.001) loss 0.6280 (1.1645) lr 1.2369e-04 eta 3:01:42
epoch [48/50] batch [660/2000] time 2.007 (2.034) data 0.000 (0.001) loss 0.1912 (1.1649) lr 1.2369e-04 eta 3:01:03
epoch [48/50] batch [680/2000] time 1.981 (2.034) data 0.000 (0.001) loss 1.7036 (1.1709) lr 1.2369e-04 eta 3:00:23
epoch [48/50] batch [700/2000] time 1.976 (2.034) data 0.000 (0.001) loss 1.3536 (1.1732) lr 1.2369e-04 eta 2:59:41
epoch [48/50] batch [720/2000] time 1.998 (2.034) data 0.000 (0.001) loss 1.1784 (1.1822) lr 1.2369e-04 eta 2:59:01
epoch [48/50] batch [740/2000] time 2.033 (2.034) data 0.000 (0.001) loss 1.0875 (1.1715) lr 1.2369e-04 eta 2:58:21
epoch [48/50] batch [760/2000] time 2.032 (2.034) data 0.000 (0.001) loss 1.0117 (1.1727) lr 1.2369e-04 eta 2:57:39
epoch [48/50] batch [780/2000] time 2.054 (2.034) data 0.000 (0.001) loss 1.5978 (1.1659) lr 1.2369e-04 eta 2:56:59
epoch [48/50] batch [800/2000] time 2.029 (2.034) data 0.000 (0.001) loss 2.0638 (1.1705) lr 1.2369e-04 eta 2:56:18
epoch [48/50] batch [820/2000] time 2.053 (2.034) data 0.000 (0.001) loss 2.5534 (1.1722) lr 1.2369e-04 eta 2:55:37
epoch [48/50] batch [840/2000] time 2.000 (2.034) data 0.000 (0.001) loss 1.5863 (1.1818) lr 1.2369e-04 eta 2:54:57
epoch [48/50] batch [860/2000] time 2.059 (2.035) data 0.000 (0.001) loss 1.0640 (1.1772) lr 1.2369e-04 eta 2:54:17
epoch [48/50] batch [880/2000] time 2.055 (2.034) data 0.000 (0.001) loss 1.0248 (1.1768) lr 1.2369e-04 eta 2:53:35
epoch [48/50] batch [900/2000] time 2.059 (2.034) data 0.000 (0.001) loss 0.7855 (1.1786) lr 1.2369e-04 eta 2:52:55
epoch [48/50] batch [920/2000] time 2.006 (2.034) data 0.000 (0.001) loss 0.6718 (1.1706) lr 1.2369e-04 eta 2:52:15
epoch [48/50] batch [940/2000] time 2.065 (2.035) data 0.000 (0.001) loss 0.1981 (1.1731) lr 1.2369e-04 eta 2:51:35
epoch [48/50] batch [960/2000] time 1.982 (2.035) data 0.000 (0.001) loss 0.3805 (1.1721) lr 1.2369e-04 eta 2:50:54
epoch [48/50] batch [980/2000] time 2.037 (2.035) data 0.000 (0.001) loss 0.8655 (1.1662) lr 1.2369e-04 eta 2:50:14
epoch [48/50] batch [1000/2000] time 2.063 (2.035) data 0.000 (0.001) loss 0.4848 (1.1632) lr 1.2369e-04 eta 2:49:34
epoch [48/50] batch [1020/2000] time 2.062 (2.035) data 0.000 (0.001) loss 1.3566 (1.1643) lr 1.2369e-04 eta 2:48:54
epoch [48/50] batch [1040/2000] time 2.063 (2.035) data 0.000 (0.001) loss 0.2282 (1.1605) lr 1.2369e-04 eta 2:48:14
epoch [48/50] batch [1060/2000] time 2.034 (2.035) data 0.000 (0.001) loss 1.6405 (1.1601) lr 1.2369e-04 eta 2:47:34
epoch [48/50] batch [1080/2000] time 2.059 (2.035) data 0.000 (0.001) loss 0.4477 (1.1561) lr 1.2369e-04 eta 2:46:53
epoch [48/50] batch [1100/2000] time 2.059 (2.035) data 0.000 (0.001) loss 0.0520 (1.1569) lr 1.2369e-04 eta 2:46:12
epoch [48/50] batch [1120/2000] time 1.996 (2.035) data 0.000 (0.001) loss 1.0153 (1.1522) lr 1.2369e-04 eta 2:45:32
epoch [48/50] batch [1140/2000] time 2.053 (2.035) data 0.001 (0.001) loss 0.0203 (1.1512) lr 1.2369e-04 eta 2:44:51
epoch [48/50] batch [1160/2000] time 1.996 (2.035) data 0.000 (0.001) loss 2.0691 (1.1524) lr 1.2369e-04 eta 2:44:09
epoch [48/50] batch [1180/2000] time 2.030 (2.035) data 0.000 (0.001) loss 0.9090 (1.1553) lr 1.2369e-04 eta 2:43:28
epoch [48/50] batch [1200/2000] time 1.998 (2.035) data 0.000 (0.001) loss 0.6259 (1.1512) lr 1.2369e-04 eta 2:42:47
epoch [48/50] batch [1220/2000] time 2.054 (2.035) data 0.000 (0.001) loss 0.5713 (1.1532) lr 1.2369e-04 eta 2:42:06
epoch [48/50] batch [1240/2000] time 2.053 (2.035) data 0.000 (0.001) loss 0.3265 (1.1535) lr 1.2369e-04 eta 2:41:24
epoch [48/50] batch [1260/2000] time 2.054 (2.035) data 0.000 (0.001) loss 1.5458 (1.1539) lr 1.2369e-04 eta 2:40:44
epoch [48/50] batch [1280/2000] time 2.032 (2.035) data 0.000 (0.001) loss 0.1701 (1.1548) lr 1.2369e-04 eta 2:40:03
epoch [48/50] batch [1300/2000] time 2.060 (2.035) data 0.000 (0.001) loss 1.0261 (1.1514) lr 1.2369e-04 eta 2:39:22
epoch [48/50] batch [1320/2000] time 2.000 (2.035) data 0.000 (0.001) loss 1.9518 (1.1555) lr 1.2369e-04 eta 2:38:42
epoch [48/50] batch [1340/2000] time 2.038 (2.035) data 0.001 (0.001) loss 1.1481 (1.1515) lr 1.2369e-04 eta 2:38:01
epoch [48/50] batch [1360/2000] time 2.003 (2.035) data 0.000 (0.001) loss 1.5266 (1.1484) lr 1.2369e-04 eta 2:37:21
epoch [48/50] batch [1380/2000] time 2.005 (2.035) data 0.000 (0.001) loss 0.0904 (1.1443) lr 1.2369e-04 eta 2:36:40
epoch [48/50] batch [1400/2000] time 1.979 (2.035) data 0.000 (0.001) loss 0.1216 (1.1424) lr 1.2369e-04 eta 2:36:00
epoch [48/50] batch [1420/2000] time 2.064 (2.035) data 0.000 (0.001) loss 0.1915 (1.1434) lr 1.2369e-04 eta 2:35:20
epoch [48/50] batch [1440/2000] time 2.036 (2.035) data 0.000 (0.001) loss 3.9136 (1.1462) lr 1.2369e-04 eta 2:34:39
epoch [48/50] batch [1460/2000] time 2.057 (2.035) data 0.000 (0.001) loss 2.5373 (1.1456) lr 1.2369e-04 eta 2:33:58
epoch [48/50] batch [1480/2000] time 2.002 (2.035) data 0.000 (0.001) loss 0.2302 (1.1434) lr 1.2369e-04 eta 2:33:18
epoch [48/50] batch [1500/2000] time 2.056 (2.035) data 0.000 (0.001) loss 0.6395 (1.1411) lr 1.2369e-04 eta 2:32:37
epoch [48/50] batch [1520/2000] time 1.977 (2.035) data 0.000 (0.001) loss 0.8800 (1.1465) lr 1.2369e-04 eta 2:31:56
epoch [48/50] batch [1540/2000] time 2.057 (2.035) data 0.000 (0.001) loss 0.5401 (1.1456) lr 1.2369e-04 eta 2:31:15
epoch [48/50] batch [1560/2000] time 2.056 (2.035) data 0.000 (0.001) loss 0.4100 (1.1451) lr 1.2369e-04 eta 2:30:35
epoch [48/50] batch [1580/2000] time 2.054 (2.035) data 0.000 (0.001) loss 0.2067 (1.1467) lr 1.2369e-04 eta 2:29:53
epoch [48/50] batch [1600/2000] time 2.054 (2.035) data 0.000 (0.001) loss 0.2076 (1.1453) lr 1.2369e-04 eta 2:29:13
epoch [48/50] batch [1620/2000] time 2.060 (2.035) data 0.000 (0.001) loss 0.0514 (1.1477) lr 1.2369e-04 eta 2:28:32
epoch [48/50] batch [1640/2000] time 2.064 (2.035) data 0.000 (0.001) loss 0.4160 (1.1467) lr 1.2369e-04 eta 2:27:51
epoch [48/50] batch [1660/2000] time 2.057 (2.035) data 0.000 (0.001) loss 1.0831 (1.1479) lr 1.2369e-04 eta 2:27:10
epoch [48/50] batch [1680/2000] time 2.009 (2.035) data 0.001 (0.001) loss 0.0130 (1.1461) lr 1.2369e-04 eta 2:26:29
epoch [48/50] batch [1700/2000] time 2.000 (2.035) data 0.000 (0.001) loss 0.7990 (1.1435) lr 1.2369e-04 eta 2:25:49
epoch [48/50] batch [1720/2000] time 2.034 (2.035) data 0.000 (0.001) loss 1.2658 (1.1403) lr 1.2369e-04 eta 2:25:08
epoch [48/50] batch [1740/2000] time 2.060 (2.035) data 0.000 (0.001) loss 0.6439 (1.1384) lr 1.2369e-04 eta 2:24:27
epoch [48/50] batch [1760/2000] time 2.057 (2.035) data 0.000 (0.001) loss 0.9910 (1.1349) lr 1.2369e-04 eta 2:23:47
epoch [48/50] batch [1780/2000] time 2.032 (2.035) data 0.000 (0.001) loss 1.5057 (1.1352) lr 1.2369e-04 eta 2:23:06
epoch [48/50] batch [1800/2000] time 2.057 (2.035) data 0.000 (0.001) loss 0.1709 (1.1334) lr 1.2369e-04 eta 2:22:26
epoch [48/50] batch [1820/2000] time 2.056 (2.035) data 0.000 (0.001) loss 1.4179 (1.1352) lr 1.2369e-04 eta 2:21:45
epoch [48/50] batch [1840/2000] time 2.057 (2.035) data 0.000 (0.001) loss 0.3115 (1.1343) lr 1.2369e-04 eta 2:21:04
epoch [48/50] batch [1860/2000] time 2.032 (2.035) data 0.000 (0.001) loss 0.9589 (1.1347) lr 1.2369e-04 eta 2:20:23
epoch [48/50] batch [1880/2000] time 2.031 (2.035) data 0.000 (0.001) loss 0.8927 (1.1380) lr 1.2369e-04 eta 2:19:42
epoch [48/50] batch [1900/2000] time 2.035 (2.035) data 0.000 (0.001) loss 0.8259 (1.1375) lr 1.2369e-04 eta 2:19:01
epoch [48/50] batch [1920/2000] time 2.060 (2.035) data 0.002 (0.001) loss 1.9742 (1.1348) lr 1.2369e-04 eta 2:18:21
epoch [48/50] batch [1940/2000] time 2.032 (2.035) data 0.000 (0.001) loss 0.0551 (1.1371) lr 1.2369e-04 eta 2:17:40
epoch [48/50] batch [1960/2000] time 1.996 (2.035) data 0.000 (0.001) loss 3.4230 (1.1363) lr 1.2369e-04 eta 2:16:59
epoch [48/50] batch [1980/2000] time 2.029 (2.035) data 0.000 (0.001) loss 0.4980 (1.1333) lr 1.2369e-04 eta 2:16:18
epoch [48/50] batch [2000/2000] time 1.997 (2.034) data 0.000 (0.001) loss 0.9119 (1.1386) lr 9.5173e-05 eta 2:15:37
epoch [49/50] batch [20/2000] time 1.974 (2.064) data 0.000 (0.035) loss 2.5612 (1.5211) lr 9.5173e-05 eta 2:16:55
epoch [49/50] batch [40/2000] time 2.003 (2.047) data 0.000 (0.017) loss 1.5243 (1.4160) lr 9.5173e-05 eta 2:15:04
epoch [49/50] batch [60/2000] time 2.027 (2.041) data 0.001 (0.012) loss 0.6742 (1.3080) lr 9.5173e-05 eta 2:14:03
epoch [49/50] batch [80/2000] time 2.049 (2.039) data 0.000 (0.009) loss 0.2319 (1.3193) lr 9.5173e-05 eta 2:13:12
epoch [49/50] batch [100/2000] time 2.056 (2.035) data 0.000 (0.007) loss 0.7397 (1.1819) lr 9.5173e-05 eta 2:12:17
epoch [49/50] batch [120/2000] time 2.071 (2.035) data 0.000 (0.006) loss 1.4548 (1.2179) lr 9.5173e-05 eta 2:11:34
epoch [49/50] batch [140/2000] time 2.057 (2.035) data 0.000 (0.005) loss 0.8324 (1.1952) lr 9.5173e-05 eta 2:10:55
epoch [49/50] batch [160/2000] time 2.061 (2.034) data 0.000 (0.005) loss 3.6076 (1.2169) lr 9.5173e-05 eta 2:10:10
epoch [49/50] batch [180/2000] time 2.058 (2.034) data 0.000 (0.004) loss 1.3034 (1.2447) lr 9.5173e-05 eta 2:09:31
epoch [49/50] batch [200/2000] time 2.035 (2.035) data 0.000 (0.004) loss 0.7375 (1.2158) lr 9.5173e-05 eta 2:08:51
epoch [49/50] batch [220/2000] time 2.004 (2.034) data 0.000 (0.003) loss 0.4050 (1.2147) lr 9.5173e-05 eta 2:08:10
epoch [49/50] batch [240/2000] time 2.036 (2.035) data 0.000 (0.003) loss 0.3065 (1.1815) lr 9.5173e-05 eta 2:07:31
epoch [49/50] batch [260/2000] time 2.004 (2.035) data 0.000 (0.003) loss 1.4453 (1.1605) lr 9.5173e-05 eta 2:06:49
epoch [49/50] batch [280/2000] time 2.004 (2.035) data 0.000 (0.003) loss 0.3520 (1.1367) lr 9.5173e-05 eta 2:06:08
epoch [49/50] batch [300/2000] time 2.027 (2.034) data 0.000 (0.003) loss 3.1901 (1.1554) lr 9.5173e-05 eta 2:05:26
epoch [49/50] batch [320/2000] time 2.027 (2.034) data 0.000 (0.002) loss 1.0048 (1.1683) lr 9.5173e-05 eta 2:04:46
epoch [49/50] batch [340/2000] time 1.999 (2.034) data 0.000 (0.002) loss 2.8962 (1.1858) lr 9.5173e-05 eta 2:04:05
epoch [49/50] batch [360/2000] time 2.035 (2.034) data 0.000 (0.002) loss 0.3880 (1.1931) lr 9.5173e-05 eta 2:03:24
epoch [49/50] batch [380/2000] time 2.048 (2.034) data 0.000 (0.002) loss 1.8863 (1.2264) lr 9.5173e-05 eta 2:02:41
epoch [49/50] batch [400/2000] time 2.049 (2.033) data 0.000 (0.002) loss 0.2302 (1.2123) lr 9.5173e-05 eta 2:01:59
epoch [49/50] batch [420/2000] time 2.051 (2.033) data 0.000 (0.002) loss 0.3326 (1.1947) lr 9.5173e-05 eta 2:01:19
epoch [49/50] batch [440/2000] time 2.049 (2.033) data 0.000 (0.002) loss 1.6747 (1.2046) lr 9.5173e-05 eta 2:00:38
epoch [49/50] batch [460/2000] time 2.052 (2.033) data 0.000 (0.002) loss 0.8097 (1.1866) lr 9.5173e-05 eta 1:59:56
epoch [49/50] batch [480/2000] time 2.053 (2.033) data 0.000 (0.002) loss 1.0247 (1.1668) lr 9.5173e-05 eta 1:59:15
epoch [49/50] batch [500/2000] time 2.060 (2.033) data 0.000 (0.002) loss 0.7128 (1.1732) lr 9.5173e-05 eta 1:58:35
epoch [49/50] batch [520/2000] time 2.053 (2.033) data 0.000 (0.002) loss 1.3903 (1.1700) lr 9.5173e-05 eta 1:57:54
epoch [49/50] batch [540/2000] time 1.975 (2.033) data 0.000 (0.002) loss 1.7279 (1.1657) lr 9.5173e-05 eta 1:57:14
epoch [49/50] batch [560/2000] time 2.051 (2.033) data 0.000 (0.001) loss 0.5115 (1.1541) lr 9.5173e-05 eta 1:56:32
epoch [49/50] batch [580/2000] time 2.056 (2.033) data 0.000 (0.001) loss 1.0154 (1.1515) lr 9.5173e-05 eta 1:55:52
epoch [49/50] batch [600/2000] time 1.997 (2.033) data 0.000 (0.001) loss 0.8222 (1.1520) lr 9.5173e-05 eta 1:55:11
epoch [49/50] batch [620/2000] time 2.055 (2.033) data 0.000 (0.001) loss 0.0659 (1.1446) lr 9.5173e-05 eta 1:54:31
epoch [49/50] batch [640/2000] time 1.977 (2.033) data 0.000 (0.001) loss 1.2742 (1.1551) lr 9.5173e-05 eta 1:53:50
epoch [49/50] batch [660/2000] time 1.998 (2.033) data 0.000 (0.001) loss 0.5051 (1.1524) lr 9.5173e-05 eta 1:53:08
epoch [49/50] batch [680/2000] time 2.032 (2.033) data 0.000 (0.001) loss 0.3295 (1.1606) lr 9.5173e-05 eta 1:52:28
epoch [49/50] batch [700/2000] time 2.053 (2.032) data 0.000 (0.001) loss 0.0392 (1.1562) lr 9.5173e-05 eta 1:51:47
epoch [49/50] batch [720/2000] time 1.976 (2.032) data 0.000 (0.001) loss 1.3624 (1.1487) lr 9.5173e-05 eta 1:51:05
epoch [49/50] batch [740/2000] time 1.995 (2.032) data 0.000 (0.001) loss 1.7321 (1.1463) lr 9.5173e-05 eta 1:50:24
epoch [49/50] batch [760/2000] time 2.052 (2.032) data 0.000 (0.001) loss 1.2106 (1.1488) lr 9.5173e-05 eta 1:49:43
epoch [49/50] batch [780/2000] time 2.048 (2.032) data 0.000 (0.001) loss 0.4139 (1.1488) lr 9.5173e-05 eta 1:49:02
epoch [49/50] batch [800/2000] time 2.052 (2.032) data 0.000 (0.001) loss 1.6901 (1.1478) lr 9.5173e-05 eta 1:48:21
epoch [49/50] batch [820/2000] time 1.999 (2.031) data 0.000 (0.001) loss 0.7446 (1.1496) lr 9.5173e-05 eta 1:47:39
epoch [49/50] batch [840/2000] time 2.055 (2.032) data 0.000 (0.001) loss 0.4101 (1.1488) lr 9.5173e-05 eta 1:46:59
epoch [49/50] batch [860/2000] time 2.058 (2.032) data 0.000 (0.001) loss 0.0749 (1.1517) lr 9.5173e-05 eta 1:46:19
epoch [49/50] batch [880/2000] time 2.054 (2.032) data 0.000 (0.001) loss 0.1026 (1.1458) lr 9.5173e-05 eta 1:45:38
epoch [49/50] batch [900/2000] time 2.002 (2.032) data 0.000 (0.001) loss 1.2140 (1.1544) lr 9.5173e-05 eta 1:44:58
epoch [49/50] batch [920/2000] time 2.002 (2.032) data 0.000 (0.001) loss 0.0155 (1.1548) lr 9.5173e-05 eta 1:44:17
epoch [49/50] batch [940/2000] time 2.048 (2.032) data 0.000 (0.001) loss 0.6519 (1.1581) lr 9.5173e-05 eta 1:43:37
epoch [49/50] batch [960/2000] time 2.027 (2.031) data 0.000 (0.001) loss 0.6145 (1.1537) lr 9.5173e-05 eta 1:42:55
epoch [49/50] batch [980/2000] time 2.048 (2.031) data 0.000 (0.001) loss 0.2561 (1.1535) lr 9.5173e-05 eta 1:42:14
epoch [49/50] batch [1000/2000] time 2.051 (2.031) data 0.000 (0.001) loss 3.9575 (1.1561) lr 9.5173e-05 eta 1:41:33
epoch [49/50] batch [1020/2000] time 2.054 (2.031) data 0.000 (0.001) loss 2.6182 (1.1518) lr 9.5173e-05 eta 1:40:53
epoch [49/50] batch [1040/2000] time 1.975 (2.031) data 0.000 (0.001) loss 3.5564 (1.1564) lr 9.5173e-05 eta 1:40:12
epoch [49/50] batch [1060/2000] time 2.002 (2.031) data 0.000 (0.001) loss 0.3034 (1.1625) lr 9.5173e-05 eta 1:39:31
epoch [49/50] batch [1080/2000] time 2.051 (2.031) data 0.000 (0.001) loss 0.9482 (1.1622) lr 9.5173e-05 eta 1:38:50
epoch [49/50] batch [1100/2000] time 2.053 (2.031) data 0.000 (0.001) loss 0.6993 (1.1585) lr 9.5173e-05 eta 1:38:09
epoch [49/50] batch [1120/2000] time 2.047 (2.031) data 0.000 (0.001) loss 0.2953 (1.1681) lr 9.5173e-05 eta 1:37:28
epoch [49/50] batch [1140/2000] time 2.026 (2.031) data 0.001 (0.001) loss 1.1841 (1.1667) lr 9.5173e-05 eta 1:36:47
epoch [49/50] batch [1160/2000] time 2.003 (2.030) data 0.000 (0.001) loss 0.9835 (1.1689) lr 9.5173e-05 eta 1:36:06
epoch [49/50] batch [1180/2000] time 2.051 (2.031) data 0.000 (0.001) loss 1.7919 (1.1651) lr 9.5173e-05 eta 1:35:26
epoch [49/50] batch [1200/2000] time 1.975 (2.030) data 0.000 (0.001) loss 0.0505 (1.1664) lr 9.5173e-05 eta 1:34:45
epoch [49/50] batch [1220/2000] time 1.999 (2.030) data 0.000 (0.001) loss 1.9848 (1.1627) lr 9.5173e-05 eta 1:34:04
epoch [49/50] batch [1240/2000] time 1.998 (2.030) data 0.000 (0.001) loss 0.2961 (1.1611) lr 9.5173e-05 eta 1:33:24
epoch [49/50] batch [1260/2000] time 1.999 (2.030) data 0.000 (0.001) loss 0.4607 (1.1592) lr 9.5173e-05 eta 1:32:43
epoch [49/50] batch [1280/2000] time 2.050 (2.030) data 0.000 (0.001) loss 1.2818 (1.1606) lr 9.5173e-05 eta 1:32:02
epoch [49/50] batch [1300/2000] time 1.975 (2.030) data 0.000 (0.001) loss 1.1535 (1.1548) lr 9.5173e-05 eta 1:31:21
epoch [49/50] batch [1320/2000] time 2.031 (2.030) data 0.000 (0.001) loss 0.0974 (1.1528) lr 9.5173e-05 eta 1:30:41
epoch [49/50] batch [1340/2000] time 1.999 (2.030) data 0.000 (0.001) loss 1.8029 (1.1510) lr 9.5173e-05 eta 1:30:00
epoch [49/50] batch [1360/2000] time 2.025 (2.030) data 0.000 (0.001) loss 1.8531 (1.1518) lr 9.5173e-05 eta 1:29:20
epoch [49/50] batch [1380/2000] time 1.995 (2.030) data 0.000 (0.001) loss 1.7528 (1.1549) lr 9.5173e-05 eta 1:28:39
epoch [49/50] batch [1400/2000] time 2.058 (2.030) data 0.000 (0.001) loss 0.2424 (1.1545) lr 9.5173e-05 eta 1:27:58
epoch [49/50] batch [1420/2000] time 1.974 (2.030) data 0.000 (0.001) loss 0.6590 (1.1512) lr 9.5173e-05 eta 1:27:17
epoch [49/50] batch [1440/2000] time 2.055 (2.030) data 0.000 (0.001) loss 0.1775 (1.1473) lr 9.5173e-05 eta 1:26:37
epoch [49/50] batch [1460/2000] time 2.001 (2.030) data 0.000 (0.001) loss 0.9437 (1.1506) lr 9.5173e-05 eta 1:25:57
epoch [49/50] batch [1480/2000] time 2.033 (2.030) data 0.000 (0.001) loss 1.3138 (1.1498) lr 9.5173e-05 eta 1:25:16
epoch [49/50] batch [1500/2000] time 2.062 (2.030) data 0.001 (0.001) loss 2.8587 (1.1485) lr 9.5173e-05 eta 1:24:36
epoch [49/50] batch [1520/2000] time 2.057 (2.031) data 0.000 (0.001) loss 0.4348 (1.1501) lr 9.5173e-05 eta 1:23:55
epoch [49/50] batch [1540/2000] time 2.032 (2.031) data 0.000 (0.001) loss 0.5232 (1.1498) lr 9.5173e-05 eta 1:23:15
epoch [49/50] batch [1560/2000] time 2.032 (2.031) data 0.000 (0.001) loss 1.2781 (1.1495) lr 9.5173e-05 eta 1:22:34
epoch [49/50] batch [1580/2000] time 2.055 (2.031) data 0.000 (0.001) loss 0.6332 (1.1500) lr 9.5173e-05 eta 1:21:54
epoch [49/50] batch [1600/2000] time 2.055 (2.031) data 0.000 (0.001) loss 0.3547 (1.1531) lr 9.5173e-05 eta 1:21:13
epoch [49/50] batch [1620/2000] time 1.995 (2.031) data 0.000 (0.001) loss 3.3917 (1.1564) lr 9.5173e-05 eta 1:20:32
epoch [49/50] batch [1640/2000] time 2.027 (2.031) data 0.000 (0.001) loss 0.7114 (1.1557) lr 9.5173e-05 eta 1:19:52
epoch [49/50] batch [1660/2000] time 2.029 (2.031) data 0.000 (0.001) loss 0.5703 (1.1532) lr 9.5173e-05 eta 1:19:11
epoch [49/50] batch [1680/2000] time 2.056 (2.031) data 0.001 (0.001) loss 0.2079 (1.1521) lr 9.5173e-05 eta 1:18:30
epoch [49/50] batch [1700/2000] time 2.002 (2.031) data 0.000 (0.001) loss 1.3210 (1.1508) lr 9.5173e-05 eta 1:17:50
epoch [49/50] batch [1720/2000] time 2.059 (2.031) data 0.000 (0.001) loss 3.4826 (1.1522) lr 9.5173e-05 eta 1:17:10
epoch [49/50] batch [1740/2000] time 2.055 (2.031) data 0.000 (0.001) loss 0.3756 (1.1512) lr 9.5173e-05 eta 1:16:29
epoch [49/50] batch [1760/2000] time 2.054 (2.031) data 0.000 (0.001) loss 2.0880 (1.1513) lr 9.5173e-05 eta 1:15:49
epoch [49/50] batch [1780/2000] time 2.055 (2.031) data 0.000 (0.001) loss 1.5724 (1.1533) lr 9.5173e-05 eta 1:15:08
epoch [49/50] batch [1800/2000] time 2.032 (2.031) data 0.000 (0.001) loss 0.0913 (1.1503) lr 9.5173e-05 eta 1:14:28
epoch [49/50] batch [1820/2000] time 2.030 (2.031) data 0.000 (0.001) loss 0.2473 (1.1466) lr 9.5173e-05 eta 1:13:47
epoch [49/50] batch [1840/2000] time 1.999 (2.031) data 0.000 (0.001) loss 0.7339 (1.1505) lr 9.5173e-05 eta 1:13:06
epoch [49/50] batch [1860/2000] time 1.973 (2.031) data 0.000 (0.001) loss 0.3763 (1.1488) lr 9.5173e-05 eta 1:12:26
epoch [49/50] batch [1880/2000] time 2.049 (2.031) data 0.000 (0.001) loss 0.3525 (1.1482) lr 9.5173e-05 eta 1:11:45
epoch [49/50] batch [1900/2000] time 2.051 (2.031) data 0.000 (0.001) loss 0.8834 (1.1501) lr 9.5173e-05 eta 1:11:05
epoch [49/50] batch [1920/2000] time 2.052 (2.031) data 0.000 (0.001) loss 2.2868 (1.1529) lr 9.5173e-05 eta 1:10:24
epoch [49/50] batch [1940/2000] time 2.053 (2.031) data 0.000 (0.001) loss 1.5497 (1.1501) lr 9.5173e-05 eta 1:09:43
epoch [49/50] batch [1960/2000] time 2.053 (2.031) data 0.000 (0.001) loss 1.0069 (1.1483) lr 9.5173e-05 eta 1:09:03
epoch [49/50] batch [1980/2000] time 2.001 (2.031) data 0.000 (0.001) loss 1.4688 (1.1518) lr 9.5173e-05 eta 1:08:22
epoch [49/50] batch [2000/2000] time 1.995 (2.031) data 0.000 (0.001) loss 0.6185 (1.1520) lr 7.0224e-05 eta 1:07:42
epoch [50/50] batch [20/2000] time 2.058 (2.073) data 0.000 (0.034) loss 0.2339 (1.3432) lr 7.0224e-05 eta 1:08:23
epoch [50/50] batch [40/2000] time 2.054 (2.049) data 0.000 (0.017) loss 2.2981 (1.3416) lr 7.0224e-05 eta 1:06:56
epoch [50/50] batch [60/2000] time 2.052 (2.041) data 0.001 (0.012) loss 0.2955 (1.2881) lr 7.0224e-05 eta 1:06:00
epoch [50/50] batch [80/2000] time 2.053 (2.040) data 0.000 (0.009) loss 3.2179 (1.2814) lr 7.0224e-05 eta 1:05:16
epoch [50/50] batch [100/2000] time 2.056 (2.038) data 0.000 (0.007) loss 0.1585 (1.2177) lr 7.0224e-05 eta 1:04:31
epoch [50/50] batch [120/2000] time 2.056 (2.037) data 0.000 (0.006) loss 0.9497 (1.1795) lr 7.0224e-05 eta 1:03:49
epoch [50/50] batch [140/2000] time 2.031 (2.036) data 0.000 (0.005) loss 0.7251 (1.2160) lr 7.0224e-05 eta 1:03:07
epoch [50/50] batch [160/2000] time 2.003 (2.036) data 0.000 (0.004) loss 0.7036 (1.1889) lr 7.0224e-05 eta 1:02:25
epoch [50/50] batch [180/2000] time 2.056 (2.036) data 0.000 (0.004) loss 0.7003 (1.1823) lr 7.0224e-05 eta 1:01:45
epoch [50/50] batch [200/2000] time 2.002 (2.035) data 0.000 (0.004) loss 0.4948 (1.1836) lr 7.0224e-05 eta 1:01:03
epoch [50/50] batch [220/2000] time 2.032 (2.035) data 0.000 (0.003) loss 0.1427 (1.1601) lr 7.0224e-05 eta 1:00:22
epoch [50/50] batch [240/2000] time 1.977 (2.035) data 0.000 (0.003) loss 1.7838 (1.1287) lr 7.0224e-05 eta 0:59:41
epoch [50/50] batch [260/2000] time 2.054 (2.035) data 0.000 (0.003) loss 0.5560 (1.1294) lr 7.0224e-05 eta 0:59:00
epoch [50/50] batch [280/2000] time 1.998 (2.035) data 0.000 (0.003) loss 3.5662 (1.1265) lr 7.0224e-05 eta 0:58:19
epoch [50/50] batch [300/2000] time 2.034 (2.035) data 0.000 (0.003) loss 0.0304 (1.1137) lr 7.0224e-05 eta 0:57:38
epoch [50/50] batch [320/2000] time 2.063 (2.034) data 0.000 (0.002) loss 0.0973 (1.1097) lr 7.0224e-05 eta 0:56:57
epoch [50/50] batch [340/2000] time 2.003 (2.034) data 0.000 (0.002) loss 0.3724 (1.1062) lr 7.0224e-05 eta 0:56:16
epoch [50/50] batch [360/2000] time 2.054 (2.034) data 0.000 (0.002) loss 2.4945 (1.0924) lr 7.0224e-05 eta 0:55:35
epoch [50/50] batch [380/2000] time 2.010 (2.034) data 0.000 (0.002) loss 1.5135 (1.1003) lr 7.0224e-05 eta 0:54:55
epoch [50/50] batch [400/2000] time 2.053 (2.034) data 0.000 (0.002) loss 1.0729 (1.0898) lr 7.0224e-05 eta 0:54:14
epoch [50/50] batch [420/2000] time 2.001 (2.034) data 0.000 (0.002) loss 1.2793 (1.0916) lr 7.0224e-05 eta 0:53:33
epoch [50/50] batch [440/2000] time 2.059 (2.034) data 0.000 (0.002) loss 1.1245 (1.0958) lr 7.0224e-05 eta 0:52:53
epoch [50/50] batch [460/2000] time 2.055 (2.034) data 0.000 (0.002) loss 0.2180 (1.0841) lr 7.0224e-05 eta 0:52:12
epoch [50/50] batch [480/2000] time 1.999 (2.034) data 0.000 (0.002) loss 1.1816 (1.0949) lr 7.0224e-05 eta 0:51:31
epoch [50/50] batch [500/2000] time 2.054 (2.034) data 0.000 (0.002) loss 0.5355 (1.0910) lr 7.0224e-05 eta 0:50:51
epoch [50/50] batch [520/2000] time 1.980 (2.034) data 0.000 (0.002) loss 0.4925 (1.0878) lr 7.0224e-05 eta 0:50:10
epoch [50/50] batch [540/2000] time 2.056 (2.034) data 0.000 (0.001) loss 2.1881 (1.0915) lr 7.0224e-05 eta 0:49:29
epoch [50/50] batch [560/2000] time 2.061 (2.034) data 0.000 (0.001) loss 1.1277 (1.0907) lr 7.0224e-05 eta 0:48:48
epoch [50/50] batch [580/2000] time 2.057 (2.034) data 0.000 (0.001) loss 0.6466 (1.0888) lr 7.0224e-05 eta 0:48:08
epoch [50/50] batch [600/2000] time 2.057 (2.034) data 0.001 (0.001) loss 1.3044 (1.0940) lr 7.0224e-05 eta 0:47:27
epoch [50/50] batch [620/2000] time 2.059 (2.034) data 0.000 (0.001) loss 1.2570 (1.1039) lr 7.0224e-05 eta 0:46:46
epoch [50/50] batch [640/2000] time 2.058 (2.034) data 0.000 (0.001) loss 1.1191 (1.1052) lr 7.0224e-05 eta 0:46:06
epoch [50/50] batch [660/2000] time 2.033 (2.034) data 0.000 (0.001) loss 1.8674 (1.1101) lr 7.0224e-05 eta 0:45:25
epoch [50/50] batch [680/2000] time 2.061 (2.034) data 0.000 (0.001) loss 1.9399 (1.1081) lr 7.0224e-05 eta 0:44:45
epoch [50/50] batch [700/2000] time 2.033 (2.034) data 0.000 (0.001) loss 1.6573 (1.1012) lr 7.0224e-05 eta 0:44:04
epoch [50/50] batch [720/2000] time 2.034 (2.034) data 0.000 (0.001) loss 0.9554 (1.0971) lr 7.0224e-05 eta 0:43:23
epoch [50/50] batch [740/2000] time 2.006 (2.034) data 0.000 (0.001) loss 1.4648 (1.0956) lr 7.0224e-05 eta 0:42:43
epoch [50/50] batch [760/2000] time 1.977 (2.034) data 0.000 (0.001) loss 0.2054 (1.0980) lr 7.0224e-05 eta 0:42:02
epoch [50/50] batch [780/2000] time 2.034 (2.034) data 0.000 (0.001) loss 0.1060 (1.0979) lr 7.0224e-05 eta 0:41:22
epoch [50/50] batch [800/2000] time 2.035 (2.034) data 0.000 (0.001) loss 1.4176 (1.1015) lr 7.0224e-05 eta 0:40:41
epoch [50/50] batch [820/2000] time 2.055 (2.035) data 0.000 (0.001) loss 0.3836 (1.1094) lr 7.0224e-05 eta 0:40:00
epoch [50/50] batch [840/2000] time 2.003 (2.035) data 0.000 (0.001) loss 2.8621 (1.1106) lr 7.0224e-05 eta 0:39:20
epoch [50/50] batch [860/2000] time 2.030 (2.035) data 0.000 (0.001) loss 1.5815 (1.1169) lr 7.0224e-05 eta 0:38:39
epoch [50/50] batch [880/2000] time 2.030 (2.035) data 0.000 (0.001) loss 2.8597 (1.1125) lr 7.0224e-05 eta 0:37:58
epoch [50/50] batch [900/2000] time 2.000 (2.035) data 0.000 (0.001) loss 0.0054 (1.1043) lr 7.0224e-05 eta 0:37:18
epoch [50/50] batch [920/2000] time 2.001 (2.035) data 0.000 (0.001) loss 0.7906 (1.1050) lr 7.0224e-05 eta 0:36:37
epoch [50/50] batch [940/2000] time 2.034 (2.035) data 0.000 (0.001) loss 1.3970 (1.1051) lr 7.0224e-05 eta 0:35:56
epoch [50/50] batch [960/2000] time 2.032 (2.035) data 0.000 (0.001) loss 0.4495 (1.0987) lr 7.0224e-05 eta 0:35:16
epoch [50/50] batch [980/2000] time 2.056 (2.035) data 0.000 (0.001) loss 4.2542 (1.1052) lr 7.0224e-05 eta 0:34:35
epoch [50/50] batch [1000/2000] time 1.976 (2.034) data 0.000 (0.001) loss 1.8171 (1.1125) lr 7.0224e-05 eta 0:33:54
epoch [50/50] batch [1020/2000] time 2.064 (2.034) data 0.000 (0.001) loss 1.5850 (1.1204) lr 7.0224e-05 eta 0:33:13
epoch [50/50] batch [1040/2000] time 2.059 (2.034) data 0.000 (0.001) loss 3.5648 (1.1280) lr 7.0224e-05 eta 0:32:32
epoch [50/50] batch [1060/2000] time 2.058 (2.034) data 0.000 (0.001) loss 0.4043 (1.1333) lr 7.0224e-05 eta 0:31:51
epoch [50/50] batch [1080/2000] time 2.055 (2.034) data 0.000 (0.001) loss 2.3889 (1.1300) lr 7.0224e-05 eta 0:31:11
epoch [50/50] batch [1100/2000] time 1.974 (2.034) data 0.000 (0.001) loss 1.8979 (1.1301) lr 7.0224e-05 eta 0:30:30
epoch [50/50] batch [1120/2000] time 2.002 (2.034) data 0.000 (0.001) loss 1.2796 (1.1287) lr 7.0224e-05 eta 0:29:50
epoch [50/50] batch [1140/2000] time 2.058 (2.034) data 0.001 (0.001) loss 1.3823 (1.1310) lr 7.0224e-05 eta 0:29:09
epoch [50/50] batch [1160/2000] time 2.030 (2.034) data 0.000 (0.001) loss 0.7389 (1.1276) lr 7.0224e-05 eta 0:28:28
epoch [50/50] batch [1180/2000] time 2.032 (2.034) data 0.000 (0.001) loss 0.5209 (1.1280) lr 7.0224e-05 eta 0:27:48
epoch [50/50] batch [1200/2000] time 2.001 (2.034) data 0.000 (0.001) loss 1.0517 (1.1311) lr 7.0224e-05 eta 0:27:07
epoch [50/50] batch [1220/2000] time 1.998 (2.034) data 0.000 (0.001) loss 1.1151 (1.1338) lr 7.0224e-05 eta 0:26:26
epoch [50/50] batch [1240/2000] time 2.057 (2.034) data 0.000 (0.001) loss 2.3510 (1.1308) lr 7.0224e-05 eta 0:25:45
epoch [50/50] batch [1260/2000] time 2.057 (2.034) data 0.000 (0.001) loss 1.2876 (1.1331) lr 7.0224e-05 eta 0:25:05
epoch [50/50] batch [1280/2000] time 2.060 (2.034) data 0.000 (0.001) loss 0.2268 (1.1322) lr 7.0224e-05 eta 0:24:24
epoch [50/50] batch [1300/2000] time 2.055 (2.034) data 0.000 (0.001) loss 1.0375 (1.1358) lr 7.0224e-05 eta 0:23:43
epoch [50/50] batch [1320/2000] time 2.055 (2.034) data 0.000 (0.001) loss 1.9364 (1.1304) lr 7.0224e-05 eta 0:23:03
epoch [50/50] batch [1340/2000] time 2.002 (2.034) data 0.000 (0.001) loss 0.2475 (1.1325) lr 7.0224e-05 eta 0:22:22
epoch [50/50] batch [1360/2000] time 2.058 (2.034) data 0.000 (0.001) loss 0.7460 (1.1324) lr 7.0224e-05 eta 0:21:41
epoch [50/50] batch [1380/2000] time 2.039 (2.034) data 0.000 (0.001) loss 0.6134 (1.1361) lr 7.0224e-05 eta 0:21:01
epoch [50/50] batch [1400/2000] time 2.032 (2.034) data 0.000 (0.001) loss 0.3853 (1.1349) lr 7.0224e-05 eta 0:20:20
epoch [50/50] batch [1420/2000] time 2.040 (2.034) data 0.000 (0.001) loss 0.9977 (1.1382) lr 7.0224e-05 eta 0:19:39
epoch [50/50] batch [1440/2000] time 2.034 (2.034) data 0.000 (0.001) loss 0.1595 (1.1400) lr 7.0224e-05 eta 0:18:58
epoch [50/50] batch [1460/2000] time 2.055 (2.034) data 0.000 (0.001) loss 0.3562 (1.1368) lr 7.0224e-05 eta 0:18:18
epoch [50/50] batch [1480/2000] time 2.033 (2.034) data 0.000 (0.001) loss 0.4094 (1.1370) lr 7.0224e-05 eta 0:17:37
epoch [50/50] batch [1500/2000] time 2.056 (2.034) data 0.000 (0.001) loss 0.2951 (1.1376) lr 7.0224e-05 eta 0:16:56
epoch [50/50] batch [1520/2000] time 2.000 (2.034) data 0.000 (0.001) loss 1.8795 (1.1339) lr 7.0224e-05 eta 0:16:16
epoch [50/50] batch [1540/2000] time 2.034 (2.034) data 0.000 (0.001) loss 3.4836 (1.1332) lr 7.0224e-05 eta 0:15:35
epoch [50/50] batch [1560/2000] time 2.033 (2.034) data 0.000 (0.001) loss 1.7332 (1.1315) lr 7.0224e-05 eta 0:14:54
epoch [50/50] batch [1580/2000] time 2.050 (2.034) data 0.000 (0.001) loss 2.4441 (1.1354) lr 7.0224e-05 eta 0:14:14
epoch [50/50] batch [1600/2000] time 2.059 (2.034) data 0.000 (0.001) loss 0.3037 (1.1339) lr 7.0224e-05 eta 0:13:33
epoch [50/50] batch [1620/2000] time 2.058 (2.034) data 0.000 (0.001) loss 1.6490 (1.1364) lr 7.0224e-05 eta 0:12:52
epoch [50/50] batch [1640/2000] time 2.058 (2.034) data 0.000 (0.001) loss 0.9640 (1.1373) lr 7.0224e-05 eta 0:12:12
epoch [50/50] batch [1660/2000] time 2.007 (2.034) data 0.000 (0.001) loss 0.5959 (1.1400) lr 7.0224e-05 eta 0:11:31
epoch [50/50] batch [1680/2000] time 2.063 (2.034) data 0.001 (0.001) loss 2.2304 (1.1412) lr 7.0224e-05 eta 0:10:50
epoch [50/50] batch [1700/2000] time 2.032 (2.034) data 0.000 (0.001) loss 0.5150 (1.1392) lr 7.0224e-05 eta 0:10:10
epoch [50/50] batch [1720/2000] time 2.031 (2.034) data 0.000 (0.001) loss 2.1241 (1.1415) lr 7.0224e-05 eta 0:09:29
epoch [50/50] batch [1740/2000] time 1.998 (2.034) data 0.000 (0.001) loss 0.3488 (1.1433) lr 7.0224e-05 eta 0:08:48
epoch [50/50] batch [1760/2000] time 2.032 (2.034) data 0.000 (0.001) loss 0.8569 (1.1436) lr 7.0224e-05 eta 0:08:08
epoch [50/50] batch [1780/2000] time 2.031 (2.034) data 0.000 (0.001) loss 0.0759 (1.1446) lr 7.0224e-05 eta 0:07:27
epoch [50/50] batch [1800/2000] time 2.054 (2.034) data 0.000 (0.001) loss 2.1273 (1.1443) lr 7.0224e-05 eta 0:06:46
epoch [50/50] batch [1820/2000] time 2.000 (2.034) data 0.000 (0.001) loss 1.3304 (1.1440) lr 7.0224e-05 eta 0:06:06
epoch [50/50] batch [1840/2000] time 2.056 (2.034) data 0.000 (0.001) loss 1.4202 (1.1468) lr 7.0224e-05 eta 0:05:25
epoch [50/50] batch [1860/2000] time 2.054 (2.034) data 0.000 (0.001) loss 3.0717 (1.1485) lr 7.0224e-05 eta 0:04:44
epoch [50/50] batch [1880/2000] time 2.053 (2.034) data 0.000 (0.001) loss 2.2692 (1.1479) lr 7.0224e-05 eta 0:04:04
epoch [50/50] batch [1900/2000] time 1.977 (2.034) data 0.000 (0.001) loss 0.9273 (1.1520) lr 7.0224e-05 eta 0:03:23
epoch [50/50] batch [1920/2000] time 1.998 (2.034) data 0.000 (0.001) loss 0.4160 (1.1522) lr 7.0224e-05 eta 0:02:42
epoch [50/50] batch [1940/2000] time 2.000 (2.034) data 0.000 (0.001) loss 0.9412 (1.1554) lr 7.0224e-05 eta 0:02:02
epoch [50/50] batch [1960/2000] time 2.056 (2.034) data 0.000 (0.001) loss 2.1163 (1.1553) lr 7.0224e-05 eta 0:01:21
epoch [50/50] batch [1980/2000] time 2.027 (2.034) data 0.000 (0.001) loss 2.3845 (1.1570) lr 7.0224e-05 eta 0:00:40
epoch [50/50] batch [2000/2000] time 2.054 (2.034) data 0.000 (0.001) loss 1.6309 (1.1565) lr 4.8943e-05 eta 0:00:00
Checkpoint saved to output/base2new/train_base/imagenet/vit_b16_ep50_c4_BZ4_ProDA/seed1/prompt_learner/model.pth.tar-50
Finish training
Deploy the last-epoch model
Evaluate on the *test* set
=> result
* total: 25,000
* correct: 19,982
* accuracy: 79.93%
* error: 20.07%
* macro_f1: 79.54%
Elapsed: 3 days, 0:15:48
