***************
** Arguments **
***************
backbone: 
config_file: configs/trainers/ProDA/vit_b16_ep50_c4_BZ4_ProDA.yaml
dataset_config_file: configs/datasets/fgvc_aircraft.yaml
eval_only: False
head: 
load_epoch: None
model_dir: 
no_train: False
opts: ['DATASET.NUM_SHOTS', '16', 'DATASET.SUBSAMPLE_CLASSES', 'base']
output_dir: output/base2new/train_base/fgvc_aircraft/vit_b16_ep50_c4_BZ4_ProDA/seed3
resume: 
root: /mnt/hdd/DATA
seed: 3
source_domains: None
target_domains: None
trainer: ProDA
transforms: None
************
** Config **
************
DATALOADER:
  K_TRANSFORMS: 1
  NUM_WORKERS: 8
  RETURN_IMG0: False
  TEST:
    BATCH_SIZE: 100
    SAMPLER: SequentialSampler
  TRAIN_U:
    BATCH_SIZE: 32
    N_DOMAIN: 0
    N_INS: 16
    SAME_AS_X: True
    SAMPLER: RandomSampler
  TRAIN_X:
    BATCH_SIZE: 4
    N_DOMAIN: 0
    N_INS: 16
    SAMPLER: RandomSampler
DATASET:
  ALL_AS_UNLABELED: False
  CIFAR_C_LEVEL: 1
  CIFAR_C_TYPE: 
  NAME: FGVCAircraft
  NUM_LABELED: -1
  NUM_SHOTS: 16
  ROOT: /mnt/hdd/DATA
  SOURCE_DOMAINS: ()
  STL10_FOLD: -1
  SUBSAMPLE_CLASSES: base
  TARGET_DOMAINS: ()
  VAL_PERCENT: 0.1
INPUT:
  COLORJITTER_B: 0.4
  COLORJITTER_C: 0.4
  COLORJITTER_H: 0.1
  COLORJITTER_S: 0.4
  CROP_PADDING: 4
  CUTOUT_LEN: 16
  CUTOUT_N: 1
  GB_K: 21
  GB_P: 0.5
  GN_MEAN: 0.0
  GN_STD: 0.15
  INTERPOLATION: bicubic
  NO_TRANSFORM: False
  PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
  PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
  RANDAUGMENT_M: 10
  RANDAUGMENT_N: 2
  RGS_P: 0.2
  RRCROP_SCALE: (0.08, 1.0)
  SIZE: (224, 224)
  TRANSFORMS: ('random_resized_crop', 'random_flip', 'normalize')
MODEL:
  BACKBONE:
    NAME: ViT-B/16
    PRETRAINED: True
  HEAD:
    ACTIVATION: relu
    BN: True
    DROPOUT: 0.0
    HIDDEN_LAYERS: ()
    NAME: 
  INIT_WEIGHTS: 
OPTIM:
  ADAM_BETA1: 0.9
  ADAM_BETA2: 0.999
  BASE_LR_MULT: 0.1
  GAMMA: 0.1
  LR: 0.002
  LR_SCHEDULER: cosine
  MAX_EPOCH: 50
  MOMENTUM: 0.9
  NAME: sgd
  NEW_LAYERS: ()
  RMSPROP_ALPHA: 0.99
  SGD_DAMPNING: 0
  SGD_NESTEROV: False
  STAGED_LR: False
  STEPSIZE: (-1,)
  WARMUP_CONS_LR: 1e-05
  WARMUP_EPOCH: 5
  WARMUP_MIN_LR: 1e-05
  WARMUP_RECOUNT: True
  WARMUP_TYPE: constant
  WEIGHT_DECAY: 0.0005
OUTPUT_DIR: output/base2new/train_base/fgvc_aircraft/vit_b16_ep50_c4_BZ4_ProDA/seed3
RESUME: 
SEED: 3
TEST:
  COMPUTE_CMAT: False
  EVALUATOR: Classification
  FINAL_MODEL: last_step
  NO_TEST: False
  PER_CLASS_RESULT: False
  SPLIT: test
TRAIN:
  CHECKPOINT_FREQ: 0
  COUNT_ITER: train_x
  PRINT_FREQ: 20
TRAINER:
  CDAC:
    CLASS_LR_MULTI: 10
    P_THRESH: 0.95
    RAMPUP_COEF: 30
    RAMPUP_ITRS: 1000
    STRONG_TRANSFORMS: ()
    TOPK_MATCH: 5
  COCOOP:
    CTX_INIT: 
    N_CTX: 16
    PREC: fp16
  COOP:
    CLASS_TOKEN_POSITION: end
    CSC: False
    CTX_INIT: 
    N_CTX: 16
    PREC: fp16
  CROSSGRAD:
    ALPHA_D: 0.5
    ALPHA_F: 0.5
    EPS_D: 1.0
    EPS_F: 1.0
  DAEL:
    CONF_THRE: 0.95
    STRONG_TRANSFORMS: ()
    WEIGHT_U: 0.5
  DAELDG:
    CONF_THRE: 0.95
    STRONG_TRANSFORMS: ()
    WEIGHT_U: 0.5
  DDAIG:
    ALPHA: 0.5
    CLAMP: False
    CLAMP_MAX: 1.0
    CLAMP_MIN: -1.0
    G_ARCH: 
    LMDA: 0.3
    WARMUP: 0
  DOMAINMIX:
    ALPHA: 1.0
    BETA: 1.0
    TYPE: crossdomain
  ENTMIN:
    LMDA: 0.001
  FIXMATCH:
    CONF_THRE: 0.95
    STRONG_TRANSFORMS: ()
    WEIGHT_U: 1.0
  IVLP:
    CTX_INIT: a photo of a
    N_CTX_TEXT: 2
    N_CTX_VISION: 2
    PREC: fp16
    PROMPT_DEPTH_TEXT: 9
    PROMPT_DEPTH_VISION: 9
  M3SDA:
    LMDA: 0.5
    N_STEP_F: 4
  MAPLE:
    CTX_INIT: a photo of a
    N_CTX: 4
    PREC: fp16
    PROMPT_DEPTH: 9
  MCD:
    N_STEP_F: 4
  MEANTEACHER:
    EMA_ALPHA: 0.999
    RAMPUP: 5
    WEIGHT_U: 1.0
  MIXMATCH:
    MIXUP_BETA: 0.75
    RAMPUP: 20000
    TEMP: 2.0
    WEIGHT_U: 100.0
  MME:
    LMDA: 0.1
  NAME: ProDA
  ProDA:
    N_CTX: 4
    N_PROMPT: 32
    PREC: fp16
  SE:
    CONF_THRE: 0.95
    EMA_ALPHA: 0.999
    RAMPUP: 300
  VPT:
    CTX_INIT: a photo of a
    N_CTX_VISION: 2
    PREC: fp16
    PROMPT_DEPTH_VISION: 1
USE_CUDA: True
VERBOSE: True
VERSION: 1
Collecting env info ...
** System info **
PyTorch version: 2.2.1+cu121
Is debug build: False
CUDA used to build PyTorch: 12.1
ROCM used to build PyTorch: N/A

OS: Debian GNU/Linux 12 (bookworm) (x86_64)
GCC version: (Debian 12.2.0-14) 12.2.0
Clang version: Could not collect
CMake version: Could not collect
Libc version: glibc-2.36

Python version: 3.11.2 (main, Mar 13 2023, 12:18:29) [GCC 12.2.0] (64-bit runtime)
Python platform: Linux-6.5.13-3-pve-x86_64-with-glibc2.36
Is CUDA available: True
CUDA runtime version: 11.8.89
CUDA_MODULE_LOADING set to: LAZY
GPU models and configuration: 
GPU 0: NVIDIA A800 80GB PCIe
GPU 1: NVIDIA A800 80GB PCIe

Nvidia driver version: 525.147.05
cuDNN version: Could not collect
HIP runtime version: N/A
MIOpen runtime version: N/A
Is XNNPACK available: True

CPU:
Architecture:                       x86_64
CPU op-mode(s):                     32-bit, 64-bit
Address sizes:                      46 bits physical, 57 bits virtual
Byte Order:                         Little Endian
CPU(s):                             64
On-line CPU(s) list:                18,20,22,23,25-27,29,31,32,34,37,46-49
Off-line CPU(s) list:               0-17,19,21,24,28,30,33,35,36,38-45,50-63
Vendor ID:                          GenuineIntel
Model name:                         Intel(R) Xeon(R) Gold 6326 CPU @ 2.90GHz
CPU family:                         6
Model:                              106
Thread(s) per core:                 2
Core(s) per socket:                 16
Socket(s):                          2
Stepping:                           6
CPU(s) scaling MHz:                 98%
CPU max MHz:                        3500.0000
CPU min MHz:                        800.0000
BogoMIPS:                           5800.00
Flags:                              fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush dts acpi mmx fxsr sse sse2 ss ht tm pbe syscall nx pdpe1gb rdtscp lm constant_tsc art arch_perfmon pebs bts rep_good nopl xtopology nonstop_tsc cpuid aperfmperf pni pclmulqdq dtes64 ds_cpl vmx smx est tm2 ssse3 sdbg fma cx16 xtpr pdcm pcid dca sse4_1 sse4_2 x2apic movbe popcnt tsc_deadline_timer aes xsave avx f16c rdrand lahf_lm abm 3dnowprefetch cpuid_fault epb cat_l3 invpcid_single intel_ppin ssbd mba ibrs ibpb stibp ibrs_enhanced tpr_shadow flexpriority ept vpid ept_ad fsgsbase tsc_adjust bmi1 avx2 smep bmi2 erms invpcid cqm rdt_a avx512f avx512dq rdseed adx smap avx512ifma clflushopt clwb intel_pt avx512cd sha_ni avx512bw avx512vl xsaveopt xsavec xgetbv1 xsaves cqm_llc cqm_occup_llc cqm_mbm_total cqm_mbm_local split_lock_detect wbnoinvd dtherm ida arat pln pts vnmi avx512vbmi umip pku ospke avx512_vbmi2 gfni vaes vpclmulqdq avx512_vnni avx512_bitalg tme avx512_vpopcntdq la57 rdpid fsrm md_clear pconfig flush_l1d arch_capabilities
Virtualization:                     VT-x
L1d cache:                          1.5 MiB (32 instances)
L1i cache:                          1 MiB (32 instances)
L2 cache:                           40 MiB (32 instances)
L3 cache:                           48 MiB (2 instances)
NUMA node(s):                       2
NUMA node0 CPU(s):                  0-15,32-47
NUMA node1 CPU(s):                  16-31,48-63
Vulnerability Gather data sampling: Vulnerable: No microcode
Vulnerability Itlb multihit:        Not affected
Vulnerability L1tf:                 Not affected
Vulnerability Mds:                  Not affected
Vulnerability Meltdown:             Not affected
Vulnerability Mmio stale data:      Mitigation; Clear CPU buffers; SMT vulnerable
Vulnerability Retbleed:             Not affected
Vulnerability Spec rstack overflow: Not affected
Vulnerability Spec store bypass:    Mitigation; Speculative Store Bypass disabled via prctl
Vulnerability Spectre v1:           Mitigation; usercopy/swapgs barriers and __user pointer sanitization
Vulnerability Spectre v2:           Mitigation; Enhanced / Automatic IBRS, IBPB conditional, RSB filling, PBRSB-eIBRS SW sequence
Vulnerability Srbds:                Not affected
Vulnerability Tsx async abort:      Not affected

Versions of relevant libraries:
[pip3] flake8==3.7.9
[pip3] flake8==3.7.9
[pip3] numpy==1.26.4
[pip3] torch==2.2.1
[pip3] torchaudio==2.2.1
[pip3] torchvision==0.17.1
[pip3] triton==2.2.0
[conda] Could not collect
        Pillow (10.2.0)

Loading trainer: ProDA
Loading dataset: FGVCAircraft
Loading preprocessed few-shot data from /mnt/hdd/DATA/fgvc_aircraft/split_fewshot/shot_16_shuffled-seed_3.pkl
SUBSAMPLE BASE CLASSES!
Building transform_train
+ random resized crop (size=(224, 224), scale=(0.08, 1.0))
+ random flip
+ to torch tensor of range [0, 1]
+ normalization (mean=[0.48145466, 0.4578275, 0.40821073], std=[0.26862954, 0.26130258, 0.27577711])
Building transform_test
+ resize the smaller edge to 224
+ 224x224 center crop
+ to torch tensor of range [0, 1]
+ normalization (mean=[0.48145466, 0.4578275, 0.40821073], std=[0.26862954, 0.26130258, 0.27577711])
---------  ------------
Dataset    FGVCAircraft
# classes  50
# train_x  800
# val      200
# test     1,670
---------  ------------
Loading CLIP (backbone: ViT-B/16)
Building custom CLIP
Turning off gradients in both the image and the text encoder
Parameters to be updated: {'prompt_learner.ctx'}
Loading evaluator: Classification
No checkpoint found, train from scratch
Initialize tensorboard (log_dir=output/base2new/train_base/fgvc_aircraft/vit_b16_ep50_c4_BZ4_ProDA/seed3/tensorboard)
epoch [1/50] batch [20/200] time 0.240 (0.387) data 0.000 (0.037) loss 4.8529 (3.7293) lr 1.0000e-05 eta 1:04:23
epoch [1/50] batch [40/200] time 0.243 (0.314) data 0.000 (0.019) loss 2.3244 (3.4733) lr 1.0000e-05 eta 0:52:12
epoch [1/50] batch [60/200] time 0.242 (0.290) data 0.001 (0.012) loss 3.2121 (3.5390) lr 1.0000e-05 eta 0:48:01
epoch [1/50] batch [80/200] time 0.239 (0.278) data 0.000 (0.009) loss 1.6466 (3.4717) lr 1.0000e-05 eta 0:45:57
epoch [1/50] batch [100/200] time 0.244 (0.271) data 0.000 (0.008) loss 3.6422 (3.3893) lr 1.0000e-05 eta 0:44:40
epoch [1/50] batch [120/200] time 0.237 (0.266) data 0.000 (0.006) loss 2.6463 (3.3319) lr 1.0000e-05 eta 0:43:46
epoch [1/50] batch [140/200] time 0.238 (0.262) data 0.000 (0.006) loss 3.2921 (3.3404) lr 1.0000e-05 eta 0:43:07
epoch [1/50] batch [160/200] time 0.236 (0.260) data 0.000 (0.005) loss 1.4648 (3.3032) lr 1.0000e-05 eta 0:42:35
epoch [1/50] batch [180/200] time 0.237 (0.257) data 0.000 (0.004) loss 2.3667 (3.3009) lr 1.0000e-05 eta 0:42:08
epoch [1/50] batch [200/200] time 0.247 (0.256) data 0.000 (0.004) loss 5.0577 (3.2988) lr 1.0000e-05 eta 0:41:46
epoch [2/50] batch [20/200] time 0.240 (0.266) data 0.000 (0.025) loss 3.3470 (3.2436) lr 1.0000e-05 eta 0:43:19
epoch [2/50] batch [40/200] time 0.240 (0.253) data 0.000 (0.013) loss 2.1923 (2.9313) lr 1.0000e-05 eta 0:41:10
epoch [2/50] batch [60/200] time 0.241 (0.249) data 0.000 (0.009) loss 0.9841 (2.8430) lr 1.0000e-05 eta 0:40:26
epoch [2/50] batch [80/200] time 0.237 (0.247) data 0.000 (0.006) loss 4.5643 (2.9282) lr 1.0000e-05 eta 0:40:00
epoch [2/50] batch [100/200] time 0.243 (0.246) data 0.000 (0.005) loss 2.3735 (2.9057) lr 1.0000e-05 eta 0:39:43
epoch [2/50] batch [120/200] time 0.245 (0.245) data 0.000 (0.004) loss 2.5597 (2.8633) lr 1.0000e-05 eta 0:39:32
epoch [2/50] batch [140/200] time 0.238 (0.244) data 0.000 (0.004) loss 2.4376 (2.8685) lr 1.0000e-05 eta 0:39:21
epoch [2/50] batch [160/200] time 0.243 (0.244) data 0.000 (0.003) loss 1.9592 (2.7853) lr 1.0000e-05 eta 0:39:11
epoch [2/50] batch [180/200] time 0.243 (0.244) data 0.000 (0.003) loss 3.3637 (2.7914) lr 1.0000e-05 eta 0:39:04
epoch [2/50] batch [200/200] time 0.243 (0.243) data 0.000 (0.003) loss 1.8972 (2.8180) lr 1.0000e-05 eta 0:38:56
epoch [3/50] batch [20/200] time 0.247 (0.267) data 0.000 (0.025) loss 2.8992 (2.7628) lr 1.0000e-05 eta 0:42:33
epoch [3/50] batch [40/200] time 0.243 (0.254) data 0.000 (0.013) loss 1.9603 (2.7363) lr 1.0000e-05 eta 0:40:27
epoch [3/50] batch [60/200] time 0.240 (0.250) data 0.000 (0.009) loss 2.2126 (2.7938) lr 1.0000e-05 eta 0:39:41
epoch [3/50] batch [80/200] time 0.243 (0.248) data 0.000 (0.006) loss 3.2022 (2.7436) lr 1.0000e-05 eta 0:39:16
epoch [3/50] batch [100/200] time 0.243 (0.246) data 0.000 (0.005) loss 2.0556 (2.7493) lr 1.0000e-05 eta 0:38:57
epoch [3/50] batch [120/200] time 0.245 (0.245) data 0.000 (0.004) loss 2.4890 (2.7340) lr 1.0000e-05 eta 0:38:44
epoch [3/50] batch [140/200] time 0.244 (0.245) data 0.000 (0.004) loss 3.0639 (2.7095) lr 1.0000e-05 eta 0:38:34
epoch [3/50] batch [160/200] time 0.243 (0.244) data 0.000 (0.003) loss 1.8181 (2.7318) lr 1.0000e-05 eta 0:38:26
epoch [3/50] batch [180/200] time 0.242 (0.244) data 0.000 (0.003) loss 3.1860 (2.7408) lr 1.0000e-05 eta 0:38:18
epoch [3/50] batch [200/200] time 0.237 (0.244) data 0.000 (0.003) loss 2.4017 (2.7289) lr 1.0000e-05 eta 0:38:10
epoch [4/50] batch [20/200] time 0.238 (0.266) data 0.000 (0.025) loss 2.5465 (2.7879) lr 1.0000e-05 eta 0:41:36
epoch [4/50] batch [40/200] time 0.241 (0.254) data 0.000 (0.012) loss 2.8391 (2.8630) lr 1.0000e-05 eta 0:39:36
epoch [4/50] batch [60/200] time 0.244 (0.250) data 0.000 (0.008) loss 2.6155 (2.7366) lr 1.0000e-05 eta 0:38:53
epoch [4/50] batch [80/200] time 0.240 (0.248) data 0.000 (0.006) loss 3.4223 (2.6619) lr 1.0000e-05 eta 0:38:28
epoch [4/50] batch [100/200] time 0.241 (0.246) data 0.000 (0.005) loss 2.1691 (2.6836) lr 1.0000e-05 eta 0:38:10
epoch [4/50] batch [120/200] time 0.241 (0.245) data 0.000 (0.004) loss 1.6007 (2.6844) lr 1.0000e-05 eta 0:37:56
epoch [4/50] batch [140/200] time 0.238 (0.245) data 0.000 (0.004) loss 1.8793 (2.6767) lr 1.0000e-05 eta 0:37:45
epoch [4/50] batch [160/200] time 0.238 (0.244) data 0.000 (0.003) loss 2.4894 (2.6532) lr 1.0000e-05 eta 0:37:35
epoch [4/50] batch [180/200] time 0.237 (0.244) data 0.000 (0.003) loss 2.9628 (2.6248) lr 1.0000e-05 eta 0:37:27
epoch [4/50] batch [200/200] time 0.241 (0.243) data 0.000 (0.003) loss 2.6896 (2.6402) lr 1.0000e-05 eta 0:37:19
epoch [5/50] batch [20/200] time 0.237 (0.266) data 0.000 (0.025) loss 2.8413 (2.7418) lr 1.0000e-05 eta 0:40:46
epoch [5/50] batch [40/200] time 0.237 (0.254) data 0.000 (0.013) loss 2.2639 (2.7550) lr 1.0000e-05 eta 0:38:46
epoch [5/50] batch [60/200] time 0.241 (0.250) data 0.000 (0.009) loss 2.3626 (2.7107) lr 1.0000e-05 eta 0:38:00
epoch [5/50] batch [80/200] time 0.237 (0.247) data 0.000 (0.006) loss 2.9069 (2.6229) lr 1.0000e-05 eta 0:37:36
epoch [5/50] batch [100/200] time 0.243 (0.246) data 0.000 (0.005) loss 2.2209 (2.5930) lr 1.0000e-05 eta 0:37:21
epoch [5/50] batch [120/200] time 0.244 (0.245) data 0.000 (0.004) loss 2.7639 (2.6302) lr 1.0000e-05 eta 0:37:08
epoch [5/50] batch [140/200] time 0.244 (0.245) data 0.000 (0.004) loss 2.1718 (2.5983) lr 1.0000e-05 eta 0:36:57
epoch [5/50] batch [160/200] time 0.241 (0.244) data 0.000 (0.003) loss 2.9705 (2.6133) lr 1.0000e-05 eta 0:36:49
epoch [5/50] batch [180/200] time 0.244 (0.244) data 0.000 (0.003) loss 3.1515 (2.6410) lr 1.0000e-05 eta 0:36:42
epoch [5/50] batch [200/200] time 0.242 (0.244) data 0.000 (0.003) loss 2.4775 (2.5872) lr 2.0000e-03 eta 0:36:34
epoch [6/50] batch [20/200] time 0.243 (0.267) data 0.000 (0.026) loss 4.7647 (3.0448) lr 2.0000e-03 eta 0:39:53
epoch [6/50] batch [40/200] time 0.237 (0.255) data 0.000 (0.013) loss 2.5888 (3.0376) lr 2.0000e-03 eta 0:38:00
epoch [6/50] batch [60/200] time 0.237 (0.250) data 0.000 (0.009) loss 1.6765 (2.8635) lr 2.0000e-03 eta 0:37:17
epoch [6/50] batch [80/200] time 0.246 (0.248) data 0.000 (0.007) loss 1.6201 (2.7626) lr 2.0000e-03 eta 0:36:51
epoch [6/50] batch [100/200] time 0.240 (0.246) data 0.000 (0.005) loss 1.0576 (2.6646) lr 2.0000e-03 eta 0:36:33
epoch [6/50] batch [120/200] time 0.237 (0.246) data 0.000 (0.005) loss 2.4830 (2.6555) lr 2.0000e-03 eta 0:36:20
epoch [6/50] batch [140/200] time 0.246 (0.245) data 0.000 (0.004) loss 2.4306 (2.6527) lr 2.0000e-03 eta 0:36:09
epoch [6/50] batch [160/200] time 0.238 (0.244) data 0.000 (0.003) loss 1.7012 (2.6093) lr 2.0000e-03 eta 0:35:59
epoch [6/50] batch [180/200] time 0.241 (0.244) data 0.000 (0.003) loss 2.9816 (2.6017) lr 2.0000e-03 eta 0:35:51
epoch [6/50] batch [200/200] time 0.236 (0.244) data 0.000 (0.003) loss 2.9821 (2.5758) lr 1.9980e-03 eta 0:35:43
epoch [7/50] batch [20/200] time 0.243 (0.266) data 0.000 (0.025) loss 2.4100 (2.4278) lr 1.9980e-03 eta 0:38:54
epoch [7/50] batch [40/200] time 0.241 (0.253) data 0.000 (0.012) loss 2.0612 (2.4270) lr 1.9980e-03 eta 0:36:56
epoch [7/50] batch [60/200] time 0.241 (0.249) data 0.000 (0.008) loss 1.7076 (2.4243) lr 1.9980e-03 eta 0:36:16
epoch [7/50] batch [80/200] time 0.243 (0.247) data 0.000 (0.006) loss 1.4624 (2.3132) lr 1.9980e-03 eta 0:35:53
epoch [7/50] batch [100/200] time 0.241 (0.246) data 0.000 (0.005) loss 2.6121 (2.2909) lr 1.9980e-03 eta 0:35:38
epoch [7/50] batch [120/200] time 0.240 (0.245) data 0.000 (0.004) loss 2.2049 (2.2979) lr 1.9980e-03 eta 0:35:25
epoch [7/50] batch [140/200] time 0.242 (0.244) data 0.000 (0.004) loss 4.2307 (2.3113) lr 1.9980e-03 eta 0:35:15
epoch [7/50] batch [160/200] time 0.243 (0.244) data 0.000 (0.003) loss 1.5914 (2.3146) lr 1.9980e-03 eta 0:35:08
epoch [7/50] batch [180/200] time 0.237 (0.244) data 0.000 (0.003) loss 1.2646 (2.2885) lr 1.9980e-03 eta 0:35:01
epoch [7/50] batch [200/200] time 0.242 (0.243) data 0.000 (0.003) loss 2.7032 (2.2884) lr 1.9921e-03 eta 0:34:53
epoch [8/50] batch [20/200] time 0.243 (0.266) data 0.000 (0.026) loss 3.0149 (2.2888) lr 1.9921e-03 eta 0:38:06
epoch [8/50] batch [40/200] time 0.242 (0.254) data 0.000 (0.013) loss 2.5338 (2.2568) lr 1.9921e-03 eta 0:36:14
epoch [8/50] batch [60/200] time 0.237 (0.249) data 0.000 (0.009) loss 1.9802 (2.2586) lr 1.9921e-03 eta 0:35:28
epoch [8/50] batch [80/200] time 0.243 (0.247) data 0.000 (0.007) loss 2.0624 (2.2987) lr 1.9921e-03 eta 0:35:06
epoch [8/50] batch [100/200] time 0.242 (0.246) data 0.000 (0.005) loss 1.8584 (2.2787) lr 1.9921e-03 eta 0:34:51
epoch [8/50] batch [120/200] time 0.243 (0.245) data 0.000 (0.004) loss 1.9170 (2.2454) lr 1.9921e-03 eta 0:34:38
epoch [8/50] batch [140/200] time 0.235 (0.244) data 0.000 (0.004) loss 2.6552 (2.2277) lr 1.9921e-03 eta 0:34:27
epoch [8/50] batch [160/200] time 0.243 (0.244) data 0.000 (0.003) loss 1.9965 (2.2320) lr 1.9921e-03 eta 0:34:20
epoch [8/50] batch [180/200] time 0.240 (0.244) data 0.000 (0.003) loss 2.3806 (2.2113) lr 1.9921e-03 eta 0:34:11
epoch [8/50] batch [200/200] time 0.240 (0.243) data 0.000 (0.003) loss 1.1424 (2.1829) lr 1.9823e-03 eta 0:34:04
epoch [9/50] batch [20/200] time 0.244 (0.267) data 0.000 (0.026) loss 3.5169 (2.3014) lr 1.9823e-03 eta 0:37:15
epoch [9/50] batch [40/200] time 0.243 (0.254) data 0.000 (0.013) loss 3.0118 (2.1789) lr 1.9823e-03 eta 0:35:20
epoch [9/50] batch [60/200] time 0.241 (0.249) data 0.000 (0.009) loss 2.1076 (2.0450) lr 1.9823e-03 eta 0:34:39
epoch [9/50] batch [80/200] time 0.243 (0.247) data 0.000 (0.007) loss 2.5439 (2.0831) lr 1.9823e-03 eta 0:34:19
epoch [9/50] batch [100/200] time 0.241 (0.246) data 0.000 (0.005) loss 2.9679 (2.0858) lr 1.9823e-03 eta 0:34:03
epoch [9/50] batch [120/200] time 0.237 (0.245) data 0.000 (0.004) loss 2.2000 (2.1307) lr 1.9823e-03 eta 0:33:51
epoch [9/50] batch [140/200] time 0.243 (0.245) data 0.000 (0.004) loss 2.3555 (2.1255) lr 1.9823e-03 eta 0:33:42
epoch [9/50] batch [160/200] time 0.237 (0.244) data 0.000 (0.003) loss 2.6707 (2.0999) lr 1.9823e-03 eta 0:33:33
epoch [9/50] batch [180/200] time 0.243 (0.244) data 0.000 (0.003) loss 2.3790 (2.1113) lr 1.9823e-03 eta 0:33:25
epoch [9/50] batch [200/200] time 0.242 (0.244) data 0.000 (0.003) loss 3.9551 (2.1285) lr 1.9686e-03 eta 0:33:17
epoch [10/50] batch [20/200] time 0.243 (0.267) data 0.000 (0.025) loss 1.6199 (1.9658) lr 1.9686e-03 eta 0:36:22
epoch [10/50] batch [40/200] time 0.240 (0.253) data 0.000 (0.013) loss 2.4514 (2.1451) lr 1.9686e-03 eta 0:34:27
epoch [10/50] batch [60/200] time 0.237 (0.249) data 0.000 (0.009) loss 2.0856 (2.1822) lr 1.9686e-03 eta 0:33:47
epoch [10/50] batch [80/200] time 0.237 (0.247) data 0.000 (0.006) loss 3.4331 (2.1389) lr 1.9686e-03 eta 0:33:25
epoch [10/50] batch [100/200] time 0.240 (0.246) data 0.000 (0.005) loss 1.3492 (2.1522) lr 1.9686e-03 eta 0:33:11
epoch [10/50] batch [120/200] time 0.235 (0.245) data 0.000 (0.004) loss 1.8920 (2.1361) lr 1.9686e-03 eta 0:33:00
epoch [10/50] batch [140/200] time 0.242 (0.244) data 0.000 (0.004) loss 1.5118 (2.1469) lr 1.9686e-03 eta 0:32:50
epoch [10/50] batch [160/200] time 0.237 (0.244) data 0.000 (0.003) loss 1.9119 (2.1357) lr 1.9686e-03 eta 0:32:41
epoch [10/50] batch [180/200] time 0.243 (0.244) data 0.000 (0.003) loss 1.8607 (2.1187) lr 1.9686e-03 eta 0:32:34
epoch [10/50] batch [200/200] time 0.237 (0.243) data 0.000 (0.003) loss 2.0547 (2.1089) lr 1.9511e-03 eta 0:32:26
epoch [11/50] batch [20/200] time 0.241 (0.268) data 0.000 (0.026) loss 1.7615 (2.1404) lr 1.9511e-03 eta 0:35:38
epoch [11/50] batch [40/200] time 0.238 (0.254) data 0.000 (0.013) loss 3.3173 (2.0035) lr 1.9511e-03 eta 0:33:43
epoch [11/50] batch [60/200] time 0.240 (0.250) data 0.000 (0.009) loss 1.4356 (2.0567) lr 1.9511e-03 eta 0:33:02
epoch [11/50] batch [80/200] time 0.243 (0.247) data 0.000 (0.007) loss 1.3488 (2.0592) lr 1.9511e-03 eta 0:32:38
epoch [11/50] batch [100/200] time 0.240 (0.246) data 0.000 (0.005) loss 2.1910 (2.0715) lr 1.9511e-03 eta 0:32:21
epoch [11/50] batch [120/200] time 0.240 (0.245) data 0.000 (0.004) loss 2.8055 (2.1277) lr 1.9511e-03 eta 0:32:10
epoch [11/50] batch [140/200] time 0.237 (0.245) data 0.000 (0.004) loss 1.0527 (2.0998) lr 1.9511e-03 eta 0:32:01
epoch [11/50] batch [160/200] time 0.243 (0.244) data 0.000 (0.003) loss 1.9175 (2.1006) lr 1.9511e-03 eta 0:31:53
epoch [11/50] batch [180/200] time 0.243 (0.244) data 0.000 (0.003) loss 1.8599 (2.1067) lr 1.9511e-03 eta 0:31:46
epoch [11/50] batch [200/200] time 0.237 (0.243) data 0.000 (0.003) loss 1.9165 (2.1211) lr 1.9298e-03 eta 0:31:39
epoch [12/50] batch [20/200] time 0.243 (0.266) data 0.000 (0.026) loss 2.2483 (1.9847) lr 1.9298e-03 eta 0:34:29
epoch [12/50] batch [40/200] time 0.237 (0.253) data 0.000 (0.013) loss 2.2089 (1.9772) lr 1.9298e-03 eta 0:32:44
epoch [12/50] batch [60/200] time 0.243 (0.249) data 0.000 (0.009) loss 1.6562 (1.9626) lr 1.9298e-03 eta 0:32:07
epoch [12/50] batch [80/200] time 0.244 (0.247) data 0.000 (0.007) loss 2.3041 (2.0131) lr 1.9298e-03 eta 0:31:47
epoch [12/50] batch [100/200] time 0.238 (0.246) data 0.000 (0.005) loss 1.4644 (2.0249) lr 1.9298e-03 eta 0:31:33
epoch [12/50] batch [120/200] time 0.243 (0.245) data 0.000 (0.004) loss 1.8714 (2.0325) lr 1.9298e-03 eta 0:31:22
epoch [12/50] batch [140/200] time 0.240 (0.244) data 0.000 (0.004) loss 3.2747 (2.0126) lr 1.9298e-03 eta 0:31:12
epoch [12/50] batch [160/200] time 0.238 (0.244) data 0.000 (0.003) loss 1.8321 (1.9998) lr 1.9298e-03 eta 0:31:03
epoch [12/50] batch [180/200] time 0.238 (0.244) data 0.000 (0.003) loss 1.3908 (1.9835) lr 1.9298e-03 eta 0:30:56
epoch [12/50] batch [200/200] time 0.235 (0.243) data 0.000 (0.003) loss 2.5551 (2.0176) lr 1.9048e-03 eta 0:30:48
epoch [13/50] batch [20/200] time 0.244 (0.267) data 0.000 (0.026) loss 1.6474 (2.1872) lr 1.9048e-03 eta 0:33:40
epoch [13/50] batch [40/200] time 0.242 (0.253) data 0.000 (0.013) loss 2.5716 (2.0667) lr 1.9048e-03 eta 0:31:56
epoch [13/50] batch [60/200] time 0.244 (0.249) data 0.000 (0.009) loss 2.5534 (2.0942) lr 1.9048e-03 eta 0:31:19
epoch [13/50] batch [80/200] time 0.251 (0.247) data 0.000 (0.007) loss 1.4645 (2.0887) lr 1.9048e-03 eta 0:30:59
epoch [13/50] batch [100/200] time 0.235 (0.246) data 0.000 (0.005) loss 3.1197 (2.0785) lr 1.9048e-03 eta 0:30:45
epoch [13/50] batch [120/200] time 0.241 (0.245) data 0.000 (0.004) loss 2.6529 (2.0860) lr 1.9048e-03 eta 0:30:34
epoch [13/50] batch [140/200] time 0.243 (0.245) data 0.000 (0.004) loss 1.8707 (2.0714) lr 1.9048e-03 eta 0:30:24
epoch [13/50] batch [160/200] time 0.242 (0.244) data 0.000 (0.003) loss 1.9510 (2.0765) lr 1.9048e-03 eta 0:30:16
epoch [13/50] batch [180/200] time 0.244 (0.244) data 0.000 (0.003) loss 2.2680 (2.0838) lr 1.9048e-03 eta 0:30:08
epoch [13/50] batch [200/200] time 0.236 (0.243) data 0.000 (0.003) loss 2.0862 (2.0801) lr 1.8763e-03 eta 0:30:01
epoch [14/50] batch [20/200] time 0.242 (0.266) data 0.000 (0.025) loss 2.0027 (1.8009) lr 1.8763e-03 eta 0:32:43
epoch [14/50] batch [40/200] time 0.238 (0.253) data 0.000 (0.013) loss 2.6282 (1.9785) lr 1.8763e-03 eta 0:31:04
epoch [14/50] batch [60/200] time 0.243 (0.249) data 0.000 (0.009) loss 1.7475 (2.0518) lr 1.8763e-03 eta 0:30:30
epoch [14/50] batch [80/200] time 0.237 (0.247) data 0.000 (0.006) loss 1.6318 (1.9651) lr 1.8763e-03 eta 0:30:09
epoch [14/50] batch [100/200] time 0.243 (0.246) data 0.000 (0.005) loss 1.9012 (1.9514) lr 1.8763e-03 eta 0:29:55
epoch [14/50] batch [120/200] time 0.242 (0.245) data 0.000 (0.004) loss 3.0130 (1.9800) lr 1.8763e-03 eta 0:29:46
epoch [14/50] batch [140/200] time 0.244 (0.245) data 0.000 (0.004) loss 2.5980 (2.0121) lr 1.8763e-03 eta 0:29:37
epoch [14/50] batch [160/200] time 0.243 (0.244) data 0.000 (0.003) loss 2.0427 (1.9970) lr 1.8763e-03 eta 0:29:29
epoch [14/50] batch [180/200] time 0.237 (0.244) data 0.000 (0.003) loss 3.1570 (1.9893) lr 1.8763e-03 eta 0:29:21
epoch [14/50] batch [200/200] time 0.237 (0.244) data 0.000 (0.003) loss 2.0237 (2.0019) lr 1.8443e-03 eta 0:29:15
epoch [15/50] batch [20/200] time 0.243 (0.266) data 0.000 (0.025) loss 2.4978 (2.0719) lr 1.8443e-03 eta 0:31:52
epoch [15/50] batch [40/200] time 0.241 (0.254) data 0.000 (0.013) loss 1.7288 (1.9144) lr 1.8443e-03 eta 0:30:15
epoch [15/50] batch [60/200] time 0.241 (0.249) data 0.000 (0.008) loss 2.5622 (1.9384) lr 1.8443e-03 eta 0:29:41
epoch [15/50] batch [80/200] time 0.242 (0.248) data 0.000 (0.006) loss 1.4908 (1.9308) lr 1.8443e-03 eta 0:29:22
epoch [15/50] batch [100/200] time 0.242 (0.246) data 0.000 (0.005) loss 1.3719 (1.9253) lr 1.8443e-03 eta 0:29:08
epoch [15/50] batch [120/200] time 0.237 (0.245) data 0.000 (0.004) loss 2.2568 (1.9313) lr 1.8443e-03 eta 0:28:55
epoch [15/50] batch [140/200] time 0.243 (0.244) data 0.000 (0.004) loss 2.1728 (1.9329) lr 1.8443e-03 eta 0:28:45
epoch [15/50] batch [160/200] time 0.242 (0.244) data 0.000 (0.003) loss 2.0352 (1.9748) lr 1.8443e-03 eta 0:28:37
epoch [15/50] batch [180/200] time 0.243 (0.244) data 0.000 (0.003) loss 1.7885 (1.9633) lr 1.8443e-03 eta 0:28:29
epoch [15/50] batch [200/200] time 0.242 (0.243) data 0.000 (0.003) loss 1.5565 (1.9646) lr 1.8090e-03 eta 0:28:22
epoch [16/50] batch [20/200] time 0.242 (0.266) data 0.000 (0.026) loss 1.7666 (1.9782) lr 1.8090e-03 eta 0:30:59
epoch [16/50] batch [40/200] time 0.237 (0.253) data 0.000 (0.013) loss 1.4985 (1.9544) lr 1.8090e-03 eta 0:29:21
epoch [16/50] batch [60/200] time 0.239 (0.249) data 0.000 (0.009) loss 1.7593 (1.9191) lr 1.8090e-03 eta 0:28:46
epoch [16/50] batch [80/200] time 0.237 (0.247) data 0.000 (0.007) loss 2.5517 (1.9363) lr 1.8090e-03 eta 0:28:28
epoch [16/50] batch [100/200] time 0.242 (0.245) data 0.000 (0.005) loss 2.3144 (1.9736) lr 1.8090e-03 eta 0:28:12
epoch [16/50] batch [120/200] time 0.234 (0.244) data 0.000 (0.004) loss 1.9938 (1.9573) lr 1.8090e-03 eta 0:28:01
epoch [16/50] batch [140/200] time 0.241 (0.244) data 0.000 (0.004) loss 2.6129 (1.9610) lr 1.8090e-03 eta 0:27:52
epoch [16/50] batch [160/200] time 0.243 (0.243) data 0.000 (0.003) loss 2.7250 (1.9521) lr 1.8090e-03 eta 0:27:44
epoch [16/50] batch [180/200] time 0.237 (0.243) data 0.000 (0.003) loss 1.8216 (1.9602) lr 1.8090e-03 eta 0:27:37
epoch [16/50] batch [200/200] time 0.239 (0.243) data 0.000 (0.003) loss 1.7402 (1.9800) lr 1.7705e-03 eta 0:27:30
epoch [17/50] batch [20/200] time 0.243 (0.265) data 0.000 (0.025) loss 2.1184 (2.0572) lr 1.7705e-03 eta 0:29:59
epoch [17/50] batch [40/200] time 0.240 (0.253) data 0.000 (0.013) loss 2.6478 (2.0125) lr 1.7705e-03 eta 0:28:28
epoch [17/50] batch [60/200] time 0.242 (0.248) data 0.000 (0.009) loss 2.2443 (1.9829) lr 1.7705e-03 eta 0:27:54
epoch [17/50] batch [80/200] time 0.243 (0.246) data 0.000 (0.007) loss 3.1543 (1.9718) lr 1.7705e-03 eta 0:27:35
epoch [17/50] batch [100/200] time 0.251 (0.245) data 0.000 (0.005) loss 2.1520 (1.9790) lr 1.7705e-03 eta 0:27:23
epoch [17/50] batch [120/200] time 0.243 (0.244) data 0.000 (0.004) loss 0.8759 (1.9878) lr 1.7705e-03 eta 0:27:11
epoch [17/50] batch [140/200] time 0.240 (0.244) data 0.000 (0.004) loss 1.4828 (1.9708) lr 1.7705e-03 eta 0:27:02
epoch [17/50] batch [160/200] time 0.243 (0.243) data 0.000 (0.003) loss 1.8908 (1.9889) lr 1.7705e-03 eta 0:26:55
epoch [17/50] batch [180/200] time 0.237 (0.243) data 0.000 (0.003) loss 1.6705 (2.0143) lr 1.7705e-03 eta 0:26:48
epoch [17/50] batch [200/200] time 0.235 (0.243) data 0.000 (0.003) loss 1.2240 (2.0381) lr 1.7290e-03 eta 0:26:41
epoch [18/50] batch [20/200] time 0.242 (0.266) data 0.000 (0.025) loss 1.4392 (1.6759) lr 1.7290e-03 eta 0:29:09
epoch [18/50] batch [40/200] time 0.239 (0.252) data 0.000 (0.013) loss 1.2333 (1.6951) lr 1.7290e-03 eta 0:27:35
epoch [18/50] batch [60/200] time 0.239 (0.248) data 0.000 (0.009) loss 2.6498 (1.7787) lr 1.7290e-03 eta 0:27:03
epoch [18/50] batch [80/200] time 0.242 (0.246) data 0.000 (0.007) loss 0.8547 (1.8105) lr 1.7290e-03 eta 0:26:44
epoch [18/50] batch [100/200] time 0.241 (0.245) data 0.000 (0.005) loss 1.3463 (1.8456) lr 1.7290e-03 eta 0:26:31
epoch [18/50] batch [120/200] time 0.239 (0.244) data 0.000 (0.004) loss 3.7084 (1.9256) lr 1.7290e-03 eta 0:26:21
epoch [18/50] batch [140/200] time 0.246 (0.244) data 0.000 (0.004) loss 1.6559 (1.9234) lr 1.7290e-03 eta 0:26:13
epoch [18/50] batch [160/200] time 0.242 (0.243) data 0.000 (0.003) loss 2.2862 (1.9328) lr 1.7290e-03 eta 0:26:05
epoch [18/50] batch [180/200] time 0.239 (0.243) data 0.000 (0.003) loss 2.8327 (1.9210) lr 1.7290e-03 eta 0:25:58
epoch [18/50] batch [200/200] time 0.236 (0.242) data 0.000 (0.003) loss 1.5522 (1.9407) lr 1.6845e-03 eta 0:25:51
epoch [19/50] batch [20/200] time 0.237 (0.265) data 0.000 (0.026) loss 2.0084 (2.0917) lr 1.6845e-03 eta 0:28:13
epoch [19/50] batch [40/200] time 0.242 (0.253) data 0.000 (0.013) loss 2.3165 (2.0751) lr 1.6845e-03 eta 0:26:51
epoch [19/50] batch [60/200] time 0.240 (0.249) data 0.000 (0.009) loss 1.5208 (2.0775) lr 1.6845e-03 eta 0:26:17
epoch [19/50] batch [80/200] time 0.244 (0.247) data 0.000 (0.007) loss 2.4371 (2.0619) lr 1.6845e-03 eta 0:26:03
epoch [19/50] batch [100/200] time 0.241 (0.247) data 0.000 (0.005) loss 0.8184 (2.0042) lr 1.6845e-03 eta 0:25:52
epoch [19/50] batch [120/200] time 0.245 (0.246) data 0.000 (0.005) loss 0.9689 (1.9699) lr 1.6845e-03 eta 0:25:42
epoch [19/50] batch [140/200] time 0.243 (0.245) data 0.000 (0.004) loss 2.9049 (1.9588) lr 1.6845e-03 eta 0:25:35
epoch [19/50] batch [160/200] time 0.244 (0.245) data 0.000 (0.003) loss 1.4839 (1.9314) lr 1.6845e-03 eta 0:25:27
epoch [19/50] batch [180/200] time 0.241 (0.244) data 0.000 (0.003) loss 1.0028 (1.9439) lr 1.6845e-03 eta 0:25:20
epoch [19/50] batch [200/200] time 0.241 (0.244) data 0.000 (0.003) loss 1.6459 (1.9482) lr 1.6374e-03 eta 0:25:13
epoch [20/50] batch [20/200] time 0.239 (0.268) data 0.000 (0.026) loss 1.7937 (1.7555) lr 1.6374e-03 eta 0:27:38
epoch [20/50] batch [40/200] time 0.243 (0.255) data 0.000 (0.013) loss 2.0170 (1.8678) lr 1.6374e-03 eta 0:26:10
epoch [20/50] batch [60/200] time 0.242 (0.250) data 0.000 (0.009) loss 2.1311 (1.9243) lr 1.6374e-03 eta 0:25:37
epoch [20/50] batch [80/200] time 0.243 (0.249) data 0.000 (0.007) loss 2.4620 (1.9738) lr 1.6374e-03 eta 0:25:21
epoch [20/50] batch [100/200] time 0.237 (0.247) data 0.000 (0.005) loss 2.5325 (2.0006) lr 1.6374e-03 eta 0:25:07
epoch [20/50] batch [120/200] time 0.238 (0.246) data 0.000 (0.005) loss 1.6492 (2.0064) lr 1.6374e-03 eta 0:24:57
epoch [20/50] batch [140/200] time 0.242 (0.246) data 0.000 (0.004) loss 2.6200 (2.0101) lr 1.6374e-03 eta 0:24:47
epoch [20/50] batch [160/200] time 0.243 (0.245) data 0.000 (0.003) loss 2.0201 (1.9931) lr 1.6374e-03 eta 0:24:38
epoch [20/50] batch [180/200] time 0.245 (0.244) data 0.000 (0.003) loss 1.8037 (1.9915) lr 1.6374e-03 eta 0:24:30
epoch [20/50] batch [200/200] time 0.241 (0.244) data 0.000 (0.003) loss 1.4298 (1.9624) lr 1.5878e-03 eta 0:24:22
epoch [21/50] batch [20/200] time 0.239 (0.266) data 0.000 (0.026) loss 1.9594 (1.8976) lr 1.5878e-03 eta 0:26:29
epoch [21/50] batch [40/200] time 0.240 (0.253) data 0.000 (0.013) loss 0.9487 (1.9132) lr 1.5878e-03 eta 0:25:09
epoch [21/50] batch [60/200] time 0.240 (0.249) data 0.000 (0.009) loss 1.0678 (1.8472) lr 1.5878e-03 eta 0:24:38
epoch [21/50] batch [80/200] time 0.240 (0.247) data 0.000 (0.007) loss 1.4629 (1.7965) lr 1.5878e-03 eta 0:24:20
epoch [21/50] batch [100/200] time 0.243 (0.245) data 0.000 (0.005) loss 2.4450 (1.8517) lr 1.5878e-03 eta 0:24:08
epoch [21/50] batch [120/200] time 0.240 (0.245) data 0.000 (0.004) loss 2.1739 (1.8886) lr 1.5878e-03 eta 0:23:57
epoch [21/50] batch [140/200] time 0.240 (0.244) data 0.000 (0.004) loss 2.1766 (1.8838) lr 1.5878e-03 eta 0:23:48
epoch [21/50] batch [160/200] time 0.242 (0.243) data 0.000 (0.003) loss 1.9972 (1.8430) lr 1.5878e-03 eta 0:23:40
epoch [21/50] batch [180/200] time 0.237 (0.243) data 0.000 (0.003) loss 2.9027 (1.8695) lr 1.5878e-03 eta 0:23:33
epoch [21/50] batch [200/200] time 0.245 (0.243) data 0.000 (0.003) loss 2.0199 (1.8865) lr 1.5358e-03 eta 0:23:26
epoch [22/50] batch [20/200] time 0.242 (0.266) data 0.000 (0.025) loss 1.0488 (1.9699) lr 1.5358e-03 eta 0:25:36
epoch [22/50] batch [40/200] time 0.236 (0.253) data 0.000 (0.013) loss 2.0142 (2.0716) lr 1.5358e-03 eta 0:24:15
epoch [22/50] batch [60/200] time 0.239 (0.248) data 0.000 (0.008) loss 1.5259 (1.9661) lr 1.5358e-03 eta 0:23:45
epoch [22/50] batch [80/200] time 0.236 (0.246) data 0.000 (0.006) loss 2.3619 (1.8895) lr 1.5358e-03 eta 0:23:27
epoch [22/50] batch [100/200] time 0.239 (0.245) data 0.000 (0.005) loss 1.7180 (1.8542) lr 1.5358e-03 eta 0:23:14
epoch [22/50] batch [120/200] time 0.233 (0.244) data 0.000 (0.004) loss 1.7619 (1.8443) lr 1.5358e-03 eta 0:23:05
epoch [22/50] batch [140/200] time 0.239 (0.243) data 0.000 (0.004) loss 2.0797 (1.8366) lr 1.5358e-03 eta 0:22:57
epoch [22/50] batch [160/200] time 0.234 (0.243) data 0.000 (0.003) loss 1.5990 (1.8728) lr 1.5358e-03 eta 0:22:50
epoch [22/50] batch [180/200] time 0.242 (0.243) data 0.000 (0.003) loss 2.6013 (1.8697) lr 1.5358e-03 eta 0:22:43
epoch [22/50] batch [200/200] time 0.236 (0.242) data 0.000 (0.003) loss 3.3441 (1.8816) lr 1.4818e-03 eta 0:22:37
epoch [23/50] batch [20/200] time 0.242 (0.265) data 0.000 (0.024) loss 1.0271 (1.8847) lr 1.4818e-03 eta 0:24:39
epoch [23/50] batch [40/200] time 0.243 (0.252) data 0.000 (0.012) loss 1.5873 (1.8331) lr 1.4818e-03 eta 0:23:23
epoch [23/50] batch [60/200] time 0.242 (0.249) data 0.000 (0.008) loss 2.2532 (1.8460) lr 1.4818e-03 eta 0:22:57
epoch [23/50] batch [80/200] time 0.239 (0.246) data 0.000 (0.006) loss 2.1390 (1.8982) lr 1.4818e-03 eta 0:22:39
epoch [23/50] batch [100/200] time 0.245 (0.245) data 0.000 (0.005) loss 1.3336 (1.9046) lr 1.4818e-03 eta 0:22:27
epoch [23/50] batch [120/200] time 0.236 (0.244) data 0.000 (0.004) loss 2.4658 (1.8982) lr 1.4818e-03 eta 0:22:17
epoch [23/50] batch [140/200] time 0.241 (0.243) data 0.000 (0.004) loss 2.2355 (1.9243) lr 1.4818e-03 eta 0:22:09
epoch [23/50] batch [160/200] time 0.239 (0.243) data 0.000 (0.003) loss 1.6370 (1.9101) lr 1.4818e-03 eta 0:22:01
epoch [23/50] batch [180/200] time 0.240 (0.243) data 0.000 (0.003) loss 2.0901 (1.8995) lr 1.4818e-03 eta 0:21:54
epoch [23/50] batch [200/200] time 0.241 (0.242) data 0.000 (0.003) loss 1.2591 (1.8952) lr 1.4258e-03 eta 0:21:48
epoch [24/50] batch [20/200] time 0.240 (0.266) data 0.000 (0.025) loss 2.0932 (2.0471) lr 1.4258e-03 eta 0:23:51
epoch [24/50] batch [40/200] time 0.240 (0.253) data 0.000 (0.013) loss 3.0292 (1.8870) lr 1.4258e-03 eta 0:22:38
epoch [24/50] batch [60/200] time 0.242 (0.249) data 0.000 (0.008) loss 1.2668 (1.8671) lr 1.4258e-03 eta 0:22:09
epoch [24/50] batch [80/200] time 0.236 (0.247) data 0.000 (0.006) loss 1.4295 (1.8754) lr 1.4258e-03 eta 0:21:52
epoch [24/50] batch [100/200] time 0.236 (0.245) data 0.000 (0.005) loss 2.6043 (1.9170) lr 1.4258e-03 eta 0:21:40
epoch [24/50] batch [120/200] time 0.242 (0.244) data 0.000 (0.004) loss 1.8874 (1.8827) lr 1.4258e-03 eta 0:21:30
epoch [24/50] batch [140/200] time 0.237 (0.244) data 0.000 (0.004) loss 2.0223 (1.8802) lr 1.4258e-03 eta 0:21:22
epoch [24/50] batch [160/200] time 0.244 (0.243) data 0.000 (0.003) loss 0.9755 (1.8797) lr 1.4258e-03 eta 0:21:15
epoch [24/50] batch [180/200] time 0.242 (0.243) data 0.000 (0.003) loss 2.4971 (1.8888) lr 1.4258e-03 eta 0:21:08
epoch [24/50] batch [200/200] time 0.239 (0.243) data 0.000 (0.003) loss 2.0001 (1.9101) lr 1.3681e-03 eta 0:21:01
epoch [25/50] batch [20/200] time 0.241 (0.265) data 0.000 (0.025) loss 1.4188 (1.7240) lr 1.3681e-03 eta 0:22:52
epoch [25/50] batch [40/200] time 0.242 (0.252) data 0.000 (0.013) loss 2.1423 (1.8259) lr 1.3681e-03 eta 0:21:41
epoch [25/50] batch [60/200] time 0.236 (0.248) data 0.000 (0.009) loss 1.0021 (1.8290) lr 1.3681e-03 eta 0:21:16
epoch [25/50] batch [80/200] time 0.236 (0.246) data 0.000 (0.006) loss 0.7301 (1.8494) lr 1.3681e-03 eta 0:21:01
epoch [25/50] batch [100/200] time 0.244 (0.245) data 0.003 (0.005) loss 2.0028 (1.8662) lr 1.3681e-03 eta 0:20:49
epoch [25/50] batch [120/200] time 0.241 (0.244) data 0.000 (0.004) loss 1.2949 (1.8755) lr 1.3681e-03 eta 0:20:40
epoch [25/50] batch [140/200] time 0.241 (0.244) data 0.000 (0.004) loss 1.8099 (1.8838) lr 1.3681e-03 eta 0:20:32
epoch [25/50] batch [160/200] time 0.242 (0.243) data 0.000 (0.003) loss 1.7350 (1.9196) lr 1.3681e-03 eta 0:20:25
epoch [25/50] batch [180/200] time 0.241 (0.243) data 0.000 (0.003) loss 1.3446 (1.9118) lr 1.3681e-03 eta 0:20:18
epoch [25/50] batch [200/200] time 0.235 (0.242) data 0.000 (0.003) loss 1.1964 (1.9152) lr 1.3090e-03 eta 0:20:12
epoch [26/50] batch [20/200] time 0.242 (0.266) data 0.000 (0.025) loss 2.0855 (1.9341) lr 1.3090e-03 eta 0:22:04
epoch [26/50] batch [40/200] time 0.242 (0.253) data 0.000 (0.013) loss 2.3867 (1.9799) lr 1.3090e-03 eta 0:20:55
epoch [26/50] batch [60/200] time 0.236 (0.249) data 0.000 (0.009) loss 1.7936 (1.9409) lr 1.3090e-03 eta 0:20:29
epoch [26/50] batch [80/200] time 0.237 (0.247) data 0.000 (0.007) loss 1.4319 (1.9384) lr 1.3090e-03 eta 0:20:13
epoch [26/50] batch [100/200] time 0.240 (0.245) data 0.000 (0.005) loss 1.8384 (1.9604) lr 1.3090e-03 eta 0:20:02
epoch [26/50] batch [120/200] time 0.241 (0.245) data 0.000 (0.004) loss 1.2297 (1.8992) lr 1.3090e-03 eta 0:19:53
epoch [26/50] batch [140/200] time 0.240 (0.244) data 0.000 (0.004) loss 1.7265 (1.8771) lr 1.3090e-03 eta 0:19:45
epoch [26/50] batch [160/200] time 0.242 (0.243) data 0.000 (0.003) loss 1.5256 (1.8858) lr 1.3090e-03 eta 0:19:38
epoch [26/50] batch [180/200] time 0.243 (0.243) data 0.000 (0.003) loss 1.8382 (1.8886) lr 1.3090e-03 eta 0:19:31
epoch [26/50] batch [200/200] time 0.241 (0.243) data 0.000 (0.003) loss 1.2386 (1.8808) lr 1.2487e-03 eta 0:19:24
epoch [27/50] batch [20/200] time 0.243 (0.265) data 0.000 (0.025) loss 1.1895 (1.8951) lr 1.2487e-03 eta 0:21:08
epoch [27/50] batch [40/200] time 0.242 (0.253) data 0.000 (0.012) loss 1.4215 (1.8537) lr 1.2487e-03 eta 0:20:02
epoch [27/50] batch [60/200] time 0.239 (0.248) data 0.000 (0.008) loss 1.8736 (1.8459) lr 1.2487e-03 eta 0:19:37
epoch [27/50] batch [80/200] time 0.236 (0.246) data 0.000 (0.006) loss 2.1936 (1.8582) lr 1.2487e-03 eta 0:19:22
epoch [27/50] batch [100/200] time 0.235 (0.245) data 0.000 (0.005) loss 2.1329 (1.8288) lr 1.2487e-03 eta 0:19:10
epoch [27/50] batch [120/200] time 0.237 (0.244) data 0.000 (0.004) loss 3.1638 (1.8502) lr 1.2487e-03 eta 0:19:01
epoch [27/50] batch [140/200] time 0.241 (0.243) data 0.000 (0.004) loss 2.3177 (1.8617) lr 1.2487e-03 eta 0:18:54
epoch [27/50] batch [160/200] time 0.245 (0.243) data 0.000 (0.003) loss 2.2516 (1.8829) lr 1.2487e-03 eta 0:18:47
epoch [27/50] batch [180/200] time 0.240 (0.243) data 0.000 (0.003) loss 2.4029 (1.8497) lr 1.2487e-03 eta 0:18:40
epoch [27/50] batch [200/200] time 0.242 (0.242) data 0.000 (0.003) loss 1.0384 (1.8441) lr 1.1874e-03 eta 0:18:34
epoch [28/50] batch [20/200] time 0.239 (0.265) data 0.000 (0.025) loss 0.8697 (1.7314) lr 1.1874e-03 eta 0:20:12
epoch [28/50] batch [40/200] time 0.235 (0.252) data 0.000 (0.013) loss 2.0801 (1.7955) lr 1.1874e-03 eta 0:19:09
epoch [28/50] batch [60/200] time 0.243 (0.248) data 0.000 (0.008) loss 1.8600 (1.7498) lr 1.1874e-03 eta 0:18:45
epoch [28/50] batch [80/200] time 0.236 (0.246) data 0.000 (0.006) loss 0.9337 (1.8028) lr 1.1874e-03 eta 0:18:31
epoch [28/50] batch [100/200] time 0.237 (0.245) data 0.000 (0.005) loss 1.9032 (1.7820) lr 1.1874e-03 eta 0:18:21
epoch [28/50] batch [120/200] time 0.241 (0.244) data 0.000 (0.004) loss 3.2847 (1.8336) lr 1.1874e-03 eta 0:18:12
epoch [28/50] batch [140/200] time 0.239 (0.243) data 0.000 (0.004) loss 3.1403 (1.8495) lr 1.1874e-03 eta 0:18:05
epoch [28/50] batch [160/200] time 0.245 (0.243) data 0.000 (0.003) loss 1.1235 (1.8192) lr 1.1874e-03 eta 0:17:58
epoch [28/50] batch [180/200] time 0.241 (0.243) data 0.000 (0.003) loss 1.7956 (1.7981) lr 1.1874e-03 eta 0:17:52
epoch [28/50] batch [200/200] time 0.241 (0.242) data 0.000 (0.003) loss 2.7504 (1.8061) lr 1.1253e-03 eta 0:17:46
epoch [29/50] batch [20/200] time 0.236 (0.264) data 0.000 (0.025) loss 2.2436 (1.8947) lr 1.1253e-03 eta 0:19:17
epoch [29/50] batch [40/200] time 0.237 (0.252) data 0.000 (0.013) loss 2.2718 (1.7898) lr 1.1253e-03 eta 0:18:17
epoch [29/50] batch [60/200] time 0.239 (0.248) data 0.000 (0.009) loss 2.1023 (1.7938) lr 1.1253e-03 eta 0:17:54
epoch [29/50] batch [80/200] time 0.241 (0.246) data 0.000 (0.006) loss 3.4650 (1.8634) lr 1.1253e-03 eta 0:17:40
epoch [29/50] batch [100/200] time 0.241 (0.245) data 0.000 (0.005) loss 1.3546 (1.8478) lr 1.1253e-03 eta 0:17:31
epoch [29/50] batch [120/200] time 0.234 (0.244) data 0.000 (0.004) loss 2.6982 (1.8478) lr 1.1253e-03 eta 0:17:22
epoch [29/50] batch [140/200] time 0.234 (0.243) data 0.000 (0.004) loss 2.5100 (1.8437) lr 1.1253e-03 eta 0:17:15
epoch [29/50] batch [160/200] time 0.239 (0.243) data 0.000 (0.003) loss 3.0925 (1.8688) lr 1.1253e-03 eta 0:17:08
epoch [29/50] batch [180/200] time 0.239 (0.242) data 0.000 (0.003) loss 2.2063 (1.8721) lr 1.1253e-03 eta 0:17:02
epoch [29/50] batch [200/200] time 0.235 (0.242) data 0.000 (0.003) loss 2.0323 (1.8481) lr 1.0628e-03 eta 0:16:56
epoch [30/50] batch [20/200] time 0.237 (0.265) data 0.000 (0.025) loss 1.4268 (1.7845) lr 1.0628e-03 eta 0:18:29
epoch [30/50] batch [40/200] time 0.242 (0.253) data 0.000 (0.013) loss 1.9541 (1.9356) lr 1.0628e-03 eta 0:17:33
epoch [30/50] batch [60/200] time 0.242 (0.249) data 0.000 (0.009) loss 1.8759 (1.8241) lr 1.0628e-03 eta 0:17:11
epoch [30/50] batch [80/200] time 0.236 (0.247) data 0.000 (0.007) loss 1.2565 (1.7571) lr 1.0628e-03 eta 0:16:57
epoch [30/50] batch [100/200] time 0.242 (0.246) data 0.000 (0.005) loss 1.4953 (1.7941) lr 1.0628e-03 eta 0:16:46
epoch [30/50] batch [120/200] time 0.236 (0.245) data 0.000 (0.004) loss 1.5603 (1.8284) lr 1.0628e-03 eta 0:16:37
epoch [30/50] batch [140/200] time 0.242 (0.244) data 0.000 (0.004) loss 1.4096 (1.8197) lr 1.0628e-03 eta 0:16:30
epoch [30/50] batch [160/200] time 0.235 (0.244) data 0.000 (0.003) loss 0.9018 (1.8040) lr 1.0628e-03 eta 0:16:23
epoch [30/50] batch [180/200] time 0.239 (0.243) data 0.000 (0.003) loss 1.0567 (1.8123) lr 1.0628e-03 eta 0:16:17
epoch [30/50] batch [200/200] time 0.241 (0.243) data 0.000 (0.003) loss 1.4052 (1.8091) lr 1.0000e-03 eta 0:16:11
epoch [31/50] batch [20/200] time 0.237 (0.266) data 0.000 (0.026) loss 1.3301 (1.7102) lr 1.0000e-03 eta 0:17:37
epoch [31/50] batch [40/200] time 0.242 (0.253) data 0.000 (0.013) loss 3.3526 (1.7509) lr 1.0000e-03 eta 0:16:41
epoch [31/50] batch [60/200] time 0.243 (0.249) data 0.000 (0.009) loss 2.2017 (1.7341) lr 1.0000e-03 eta 0:16:19
epoch [31/50] batch [80/200] time 0.241 (0.246) data 0.000 (0.007) loss 1.5587 (1.7069) lr 1.0000e-03 eta 0:16:06
epoch [31/50] batch [100/200] time 0.242 (0.245) data 0.000 (0.005) loss 1.8126 (1.7100) lr 1.0000e-03 eta 0:15:56
epoch [31/50] batch [120/200] time 0.243 (0.244) data 0.000 (0.004) loss 2.1257 (1.7231) lr 1.0000e-03 eta 0:15:48
epoch [31/50] batch [140/200] time 0.238 (0.244) data 0.000 (0.004) loss 1.7749 (1.7623) lr 1.0000e-03 eta 0:15:41
epoch [31/50] batch [160/200] time 0.245 (0.244) data 0.000 (0.003) loss 2.9399 (1.7498) lr 1.0000e-03 eta 0:15:35
epoch [31/50] batch [180/200] time 0.241 (0.243) data 0.000 (0.003) loss 3.1637 (1.7627) lr 1.0000e-03 eta 0:15:29
epoch [31/50] batch [200/200] time 0.242 (0.243) data 0.000 (0.003) loss 2.4426 (1.7965) lr 9.3721e-04 eta 0:15:24
epoch [32/50] batch [20/200] time 0.242 (0.266) data 0.000 (0.025) loss 2.4980 (1.8685) lr 9.3721e-04 eta 0:16:43
epoch [32/50] batch [40/200] time 0.242 (0.254) data 0.000 (0.012) loss 0.9618 (1.7349) lr 9.3721e-04 eta 0:15:53
epoch [32/50] batch [60/200] time 0.237 (0.249) data 0.000 (0.008) loss 2.3806 (1.7288) lr 9.3721e-04 eta 0:15:33
epoch [32/50] batch [80/200] time 0.240 (0.247) data 0.000 (0.006) loss 1.8206 (1.7713) lr 9.3721e-04 eta 0:15:19
epoch [32/50] batch [100/200] time 0.245 (0.246) data 0.000 (0.005) loss 1.7729 (1.7494) lr 9.3721e-04 eta 0:15:10
epoch [32/50] batch [120/200] time 0.236 (0.245) data 0.000 (0.004) loss 1.5557 (1.7713) lr 9.3721e-04 eta 0:15:02
epoch [32/50] batch [140/200] time 0.243 (0.245) data 0.004 (0.004) loss 2.2397 (1.7925) lr 9.3721e-04 eta 0:14:55
epoch [32/50] batch [160/200] time 0.242 (0.244) data 0.000 (0.003) loss 1.1560 (1.7896) lr 9.3721e-04 eta 0:14:48
epoch [32/50] batch [180/200] time 0.243 (0.244) data 0.000 (0.003) loss 1.9455 (1.7735) lr 9.3721e-04 eta 0:14:42
epoch [32/50] batch [200/200] time 0.242 (0.243) data 0.000 (0.003) loss 2.4110 (1.7840) lr 8.7467e-04 eta 0:14:36
epoch [33/50] batch [20/200] time 0.242 (0.266) data 0.000 (0.025) loss 2.2072 (1.6990) lr 8.7467e-04 eta 0:15:51
epoch [33/50] batch [40/200] time 0.242 (0.253) data 0.000 (0.013) loss 2.4977 (1.7740) lr 8.7467e-04 eta 0:14:59
epoch [33/50] batch [60/200] time 0.243 (0.249) data 0.000 (0.009) loss 2.0691 (1.6971) lr 8.7467e-04 eta 0:14:39
epoch [33/50] batch [80/200] time 0.236 (0.247) data 0.000 (0.006) loss 1.2841 (1.7721) lr 8.7467e-04 eta 0:14:28
epoch [33/50] batch [100/200] time 0.240 (0.246) data 0.000 (0.005) loss 1.2639 (1.7132) lr 8.7467e-04 eta 0:14:19
epoch [33/50] batch [120/200] time 0.235 (0.245) data 0.000 (0.004) loss 1.1910 (1.7436) lr 8.7467e-04 eta 0:14:11
epoch [33/50] batch [140/200] time 0.242 (0.244) data 0.000 (0.004) loss 1.5213 (1.7456) lr 8.7467e-04 eta 0:14:04
epoch [33/50] batch [160/200] time 0.235 (0.244) data 0.000 (0.003) loss 2.1918 (1.7600) lr 8.7467e-04 eta 0:13:58
epoch [33/50] batch [180/200] time 0.242 (0.243) data 0.000 (0.003) loss 2.1283 (1.7795) lr 8.7467e-04 eta 0:13:52
epoch [33/50] batch [200/200] time 0.242 (0.243) data 0.000 (0.003) loss 1.5568 (1.7734) lr 8.1262e-04 eta 0:13:46
epoch [34/50] batch [20/200] time 0.243 (0.267) data 0.000 (0.026) loss 1.5927 (1.8794) lr 8.1262e-04 eta 0:15:03
epoch [34/50] batch [40/200] time 0.237 (0.254) data 0.000 (0.013) loss 1.0662 (1.8801) lr 8.1262e-04 eta 0:14:14
epoch [34/50] batch [60/200] time 0.237 (0.250) data 0.000 (0.009) loss 1.4826 (1.7899) lr 8.1262e-04 eta 0:13:54
epoch [34/50] batch [80/200] time 0.240 (0.247) data 0.000 (0.007) loss 1.5741 (1.8125) lr 8.1262e-04 eta 0:13:41
epoch [34/50] batch [100/200] time 0.240 (0.246) data 0.000 (0.005) loss 2.2985 (1.8069) lr 8.1262e-04 eta 0:13:31
epoch [34/50] batch [120/200] time 0.240 (0.245) data 0.000 (0.004) loss 1.9377 (1.8344) lr 8.1262e-04 eta 0:13:23
epoch [34/50] batch [140/200] time 0.243 (0.245) data 0.000 (0.004) loss 1.4528 (1.8078) lr 8.1262e-04 eta 0:13:17
epoch [34/50] batch [160/200] time 0.240 (0.244) data 0.000 (0.003) loss 2.3091 (1.8476) lr 8.1262e-04 eta 0:13:10
epoch [34/50] batch [180/200] time 0.242 (0.244) data 0.000 (0.003) loss 2.4114 (1.8374) lr 8.1262e-04 eta 0:13:04
epoch [34/50] batch [200/200] time 0.236 (0.243) data 0.000 (0.003) loss 3.2723 (1.8506) lr 7.5131e-04 eta 0:12:58
epoch [35/50] batch [20/200] time 0.240 (0.266) data 0.000 (0.026) loss 1.7091 (1.6880) lr 7.5131e-04 eta 0:14:05
epoch [35/50] batch [40/200] time 0.237 (0.253) data 0.000 (0.013) loss 2.4430 (1.7086) lr 7.5131e-04 eta 0:13:19
epoch [35/50] batch [60/200] time 0.242 (0.249) data 0.000 (0.009) loss 1.0252 (1.7058) lr 7.5131e-04 eta 0:13:01
epoch [35/50] batch [80/200] time 0.241 (0.247) data 0.000 (0.007) loss 1.1598 (1.7613) lr 7.5131e-04 eta 0:12:49
epoch [35/50] batch [100/200] time 0.243 (0.245) data 0.000 (0.005) loss 1.4297 (1.7901) lr 7.5131e-04 eta 0:12:40
epoch [35/50] batch [120/200] time 0.247 (0.245) data 0.000 (0.004) loss 3.2672 (1.8017) lr 7.5131e-04 eta 0:12:33
epoch [35/50] batch [140/200] time 0.240 (0.244) data 0.000 (0.004) loss 1.1795 (1.8007) lr 7.5131e-04 eta 0:12:26
epoch [35/50] batch [160/200] time 0.246 (0.243) data 0.000 (0.003) loss 1.1320 (1.8062) lr 7.5131e-04 eta 0:12:19
epoch [35/50] batch [180/200] time 0.242 (0.243) data 0.000 (0.003) loss 2.0226 (1.7992) lr 7.5131e-04 eta 0:12:13
epoch [35/50] batch [200/200] time 0.241 (0.243) data 0.000 (0.003) loss 1.5000 (1.8020) lr 6.9098e-04 eta 0:12:08
epoch [36/50] batch [20/200] time 0.241 (0.265) data 0.000 (0.025) loss 1.2256 (1.5984) lr 6.9098e-04 eta 0:13:09
epoch [36/50] batch [40/200] time 0.241 (0.252) data 0.000 (0.013) loss 2.3077 (1.7102) lr 6.9098e-04 eta 0:12:27
epoch [36/50] batch [60/200] time 0.236 (0.248) data 0.000 (0.008) loss 2.1903 (1.7756) lr 6.9098e-04 eta 0:12:09
epoch [36/50] batch [80/200] time 0.242 (0.246) data 0.000 (0.006) loss 1.7948 (1.7518) lr 6.9098e-04 eta 0:11:58
epoch [36/50] batch [100/200] time 0.242 (0.245) data 0.000 (0.005) loss 2.0096 (1.7031) lr 6.9098e-04 eta 0:11:49
epoch [36/50] batch [120/200] time 0.239 (0.244) data 0.000 (0.004) loss 1.5997 (1.7337) lr 6.9098e-04 eta 0:11:42
epoch [36/50] batch [140/200] time 0.236 (0.243) data 0.000 (0.004) loss 1.8187 (1.7264) lr 6.9098e-04 eta 0:11:36
epoch [36/50] batch [160/200] time 0.241 (0.243) data 0.000 (0.003) loss 1.9053 (1.7279) lr 6.9098e-04 eta 0:11:30
epoch [36/50] batch [180/200] time 0.240 (0.243) data 0.000 (0.003) loss 2.2828 (1.7350) lr 6.9098e-04 eta 0:11:24
epoch [36/50] batch [200/200] time 0.241 (0.242) data 0.000 (0.003) loss 2.6325 (1.7555) lr 6.3188e-04 eta 0:11:18
epoch [37/50] batch [20/200] time 0.237 (0.266) data 0.000 (0.025) loss 1.3183 (1.7654) lr 6.3188e-04 eta 0:12:19
epoch [37/50] batch [40/200] time 0.237 (0.253) data 0.000 (0.013) loss 1.3197 (1.7421) lr 6.3188e-04 eta 0:11:38
epoch [37/50] batch [60/200] time 0.243 (0.249) data 0.001 (0.009) loss 1.8703 (1.7329) lr 6.3188e-04 eta 0:11:22
epoch [37/50] batch [80/200] time 0.236 (0.247) data 0.000 (0.006) loss 1.1045 (1.7686) lr 6.3188e-04 eta 0:11:11
epoch [37/50] batch [100/200] time 0.241 (0.246) data 0.000 (0.005) loss 1.5894 (1.7930) lr 6.3188e-04 eta 0:11:03
epoch [37/50] batch [120/200] time 0.242 (0.245) data 0.000 (0.004) loss 2.4845 (1.7978) lr 6.3188e-04 eta 0:10:55
epoch [37/50] batch [140/200] time 0.236 (0.244) data 0.000 (0.004) loss 0.6897 (1.8056) lr 6.3188e-04 eta 0:10:48
epoch [37/50] batch [160/200] time 0.238 (0.243) data 0.000 (0.003) loss 1.7697 (1.8115) lr 6.3188e-04 eta 0:10:42
epoch [37/50] batch [180/200] time 0.242 (0.243) data 0.000 (0.003) loss 1.8388 (1.8278) lr 6.3188e-04 eta 0:10:36
epoch [37/50] batch [200/200] time 0.242 (0.243) data 0.000 (0.003) loss 1.4056 (1.8336) lr 5.7422e-04 eta 0:10:30
epoch [38/50] batch [20/200] time 0.242 (0.265) data 0.000 (0.024) loss 1.0117 (1.7249) lr 5.7422e-04 eta 0:11:23
epoch [38/50] batch [40/200] time 0.242 (0.252) data 0.000 (0.012) loss 1.8232 (1.7096) lr 5.7422e-04 eta 0:10:44
epoch [38/50] batch [60/200] time 0.242 (0.249) data 0.000 (0.008) loss 2.7137 (1.6978) lr 5.7422e-04 eta 0:10:31
epoch [38/50] batch [80/200] time 0.242 (0.247) data 0.000 (0.006) loss 2.6460 (1.7274) lr 5.7422e-04 eta 0:10:21
epoch [38/50] batch [100/200] time 0.235 (0.245) data 0.000 (0.005) loss 1.4919 (1.7120) lr 5.7422e-04 eta 0:10:13
epoch [38/50] batch [120/200] time 0.236 (0.244) data 0.000 (0.004) loss 1.0956 (1.6837) lr 5.7422e-04 eta 0:10:06
epoch [38/50] batch [140/200] time 0.234 (0.244) data 0.000 (0.004) loss 1.3668 (1.6875) lr 5.7422e-04 eta 0:10:00
epoch [38/50] batch [160/200] time 0.237 (0.243) data 0.000 (0.003) loss 1.9644 (1.6956) lr 5.7422e-04 eta 0:09:54
epoch [38/50] batch [180/200] time 0.242 (0.243) data 0.000 (0.003) loss 1.9784 (1.7118) lr 5.7422e-04 eta 0:09:48
epoch [38/50] batch [200/200] time 0.237 (0.243) data 0.000 (0.003) loss 2.1645 (1.7157) lr 5.1825e-04 eta 0:09:42
epoch [39/50] batch [20/200] time 0.240 (0.265) data 0.000 (0.025) loss 2.2495 (1.8940) lr 5.1825e-04 eta 0:10:30
epoch [39/50] batch [40/200] time 0.242 (0.253) data 0.000 (0.013) loss 1.5090 (1.8263) lr 5.1825e-04 eta 0:09:58
epoch [39/50] batch [60/200] time 0.242 (0.249) data 0.000 (0.008) loss 1.7496 (1.8472) lr 5.1825e-04 eta 0:09:43
epoch [39/50] batch [80/200] time 0.242 (0.247) data 0.000 (0.006) loss 1.6011 (1.8040) lr 5.1825e-04 eta 0:09:33
epoch [39/50] batch [100/200] time 0.240 (0.246) data 0.000 (0.005) loss 2.0659 (1.8072) lr 5.1825e-04 eta 0:09:25
epoch [39/50] batch [120/200] time 0.242 (0.245) data 0.000 (0.004) loss 3.4164 (1.7713) lr 5.1825e-04 eta 0:09:18
epoch [39/50] batch [140/200] time 0.233 (0.244) data 0.000 (0.004) loss 2.4961 (1.7676) lr 5.1825e-04 eta 0:09:11
epoch [39/50] batch [160/200] time 0.240 (0.244) data 0.000 (0.003) loss 1.9742 (1.7471) lr 5.1825e-04 eta 0:09:05
epoch [39/50] batch [180/200] time 0.251 (0.243) data 0.000 (0.003) loss 1.6119 (1.7525) lr 5.1825e-04 eta 0:08:59
epoch [39/50] batch [200/200] time 0.235 (0.243) data 0.000 (0.003) loss 2.4116 (1.7739) lr 4.6417e-04 eta 0:08:54
epoch [40/50] batch [20/200] time 0.241 (0.265) data 0.000 (0.025) loss 2.1884 (1.4973) lr 4.6417e-04 eta 0:09:36
epoch [40/50] batch [40/200] time 0.250 (0.252) data 0.000 (0.013) loss 2.1829 (1.6755) lr 4.6417e-04 eta 0:09:05
epoch [40/50] batch [60/200] time 0.241 (0.248) data 0.000 (0.009) loss 1.5438 (1.6790) lr 4.6417e-04 eta 0:08:51
epoch [40/50] batch [80/200] time 0.244 (0.246) data 0.000 (0.006) loss 2.4151 (1.6963) lr 4.6417e-04 eta 0:08:41
epoch [40/50] batch [100/200] time 0.239 (0.245) data 0.000 (0.005) loss 0.5711 (1.6765) lr 4.6417e-04 eta 0:08:34
epoch [40/50] batch [120/200] time 0.237 (0.244) data 0.000 (0.004) loss 1.7363 (1.6963) lr 4.6417e-04 eta 0:08:27
epoch [40/50] batch [140/200] time 0.242 (0.244) data 0.000 (0.004) loss 2.8808 (1.7215) lr 4.6417e-04 eta 0:08:21
epoch [40/50] batch [160/200] time 0.242 (0.243) data 0.000 (0.003) loss 0.7297 (1.7198) lr 4.6417e-04 eta 0:08:15
epoch [40/50] batch [180/200] time 0.241 (0.243) data 0.000 (0.003) loss 0.8223 (1.7421) lr 4.6417e-04 eta 0:08:10
epoch [40/50] batch [200/200] time 0.242 (0.242) data 0.000 (0.003) loss 1.0625 (1.7149) lr 4.1221e-04 eta 0:08:04
epoch [41/50] batch [20/200] time 0.242 (0.267) data 0.000 (0.027) loss 1.4869 (1.6098) lr 4.1221e-04 eta 0:08:48
epoch [41/50] batch [40/200] time 0.241 (0.254) data 0.000 (0.014) loss 1.3789 (1.6302) lr 4.1221e-04 eta 0:08:17
epoch [41/50] batch [60/200] time 0.240 (0.250) data 0.000 (0.009) loss 1.8884 (1.7162) lr 4.1221e-04 eta 0:08:04
epoch [41/50] batch [80/200] time 0.233 (0.247) data 0.000 (0.007) loss 1.1338 (1.6824) lr 4.1221e-04 eta 0:07:54
epoch [41/50] batch [100/200] time 0.237 (0.246) data 0.000 (0.006) loss 1.5172 (1.6722) lr 4.1221e-04 eta 0:07:46
epoch [41/50] batch [120/200] time 0.242 (0.245) data 0.000 (0.005) loss 1.9913 (1.7045) lr 4.1221e-04 eta 0:07:39
epoch [41/50] batch [140/200] time 0.236 (0.244) data 0.000 (0.004) loss 0.5999 (1.6962) lr 4.1221e-04 eta 0:07:33
epoch [41/50] batch [160/200] time 0.239 (0.243) data 0.000 (0.004) loss 2.8870 (1.7255) lr 4.1221e-04 eta 0:07:27
epoch [41/50] batch [180/200] time 0.237 (0.243) data 0.000 (0.003) loss 1.3590 (1.7082) lr 4.1221e-04 eta 0:07:22
epoch [41/50] batch [200/200] time 0.241 (0.243) data 0.000 (0.003) loss 2.1320 (1.7296) lr 3.6258e-04 eta 0:07:17
epoch [42/50] batch [20/200] time 0.240 (0.265) data 0.000 (0.025) loss 1.3101 (1.7068) lr 3.6258e-04 eta 0:07:51
epoch [42/50] batch [40/200] time 0.243 (0.253) data 0.000 (0.013) loss 0.9906 (1.7194) lr 3.6258e-04 eta 0:07:25
epoch [42/50] batch [60/200] time 0.239 (0.249) data 0.000 (0.009) loss 2.2657 (1.7282) lr 3.6258e-04 eta 0:07:12
epoch [42/50] batch [80/200] time 0.236 (0.246) data 0.000 (0.006) loss 1.5431 (1.7653) lr 3.6258e-04 eta 0:07:03
epoch [42/50] batch [100/200] time 0.240 (0.245) data 0.000 (0.005) loss 1.8946 (1.7515) lr 3.6258e-04 eta 0:06:56
epoch [42/50] batch [120/200] time 0.240 (0.244) data 0.000 (0.004) loss 2.4861 (1.7853) lr 3.6258e-04 eta 0:06:49
epoch [42/50] batch [140/200] time 0.240 (0.243) data 0.000 (0.004) loss 1.8647 (1.7875) lr 3.6258e-04 eta 0:06:43
epoch [42/50] batch [160/200] time 0.237 (0.243) data 0.000 (0.003) loss 1.8516 (1.8083) lr 3.6258e-04 eta 0:06:38
epoch [42/50] batch [180/200] time 0.237 (0.242) data 0.000 (0.003) loss 2.2684 (1.7943) lr 3.6258e-04 eta 0:06:32
epoch [42/50] batch [200/200] time 0.241 (0.242) data 0.000 (0.003) loss 2.1030 (1.7981) lr 3.1545e-04 eta 0:06:27
epoch [43/50] batch [20/200] time 0.242 (0.265) data 0.000 (0.025) loss 1.4708 (1.6880) lr 3.1545e-04 eta 0:06:58
epoch [43/50] batch [40/200] time 0.237 (0.253) data 0.000 (0.013) loss 2.1557 (1.7368) lr 3.1545e-04 eta 0:06:34
epoch [43/50] batch [60/200] time 0.238 (0.248) data 0.000 (0.009) loss 0.3115 (1.7178) lr 3.1545e-04 eta 0:06:22
epoch [43/50] batch [80/200] time 0.242 (0.246) data 0.000 (0.006) loss 1.0357 (1.7854) lr 3.1545e-04 eta 0:06:14
epoch [43/50] batch [100/200] time 0.242 (0.245) data 0.000 (0.005) loss 1.1945 (1.7296) lr 3.1545e-04 eta 0:06:07
epoch [43/50] batch [120/200] time 0.248 (0.244) data 0.000 (0.004) loss 2.1593 (1.7284) lr 3.1545e-04 eta 0:06:01
epoch [43/50] batch [140/200] time 0.243 (0.244) data 0.000 (0.004) loss 2.2070 (1.7116) lr 3.1545e-04 eta 0:05:56
epoch [43/50] batch [160/200] time 0.240 (0.243) data 0.000 (0.003) loss 1.5821 (1.6981) lr 3.1545e-04 eta 0:05:50
epoch [43/50] batch [180/200] time 0.240 (0.243) data 0.000 (0.003) loss 1.1709 (1.6956) lr 3.1545e-04 eta 0:05:45
epoch [43/50] batch [200/200] time 0.241 (0.243) data 0.000 (0.003) loss 2.0929 (1.7131) lr 2.7103e-04 eta 0:05:39
epoch [44/50] batch [20/200] time 0.243 (0.266) data 0.000 (0.025) loss 2.3340 (1.8131) lr 2.7103e-04 eta 0:06:06
epoch [44/50] batch [40/200] time 0.248 (0.253) data 0.000 (0.013) loss 1.9421 (1.7760) lr 2.7103e-04 eta 0:05:44
epoch [44/50] batch [60/200] time 0.242 (0.249) data 0.000 (0.009) loss 1.1086 (1.8057) lr 2.7103e-04 eta 0:05:33
epoch [44/50] batch [80/200] time 0.242 (0.247) data 0.000 (0.006) loss 1.6250 (1.8194) lr 2.7103e-04 eta 0:05:25
epoch [44/50] batch [100/200] time 0.242 (0.245) data 0.000 (0.005) loss 2.4682 (1.7941) lr 2.7103e-04 eta 0:05:19
epoch [44/50] batch [120/200] time 0.235 (0.245) data 0.000 (0.004) loss 1.8302 (1.7507) lr 2.7103e-04 eta 0:05:12
epoch [44/50] batch [140/200] time 0.239 (0.244) data 0.000 (0.004) loss 2.8551 (1.7659) lr 2.7103e-04 eta 0:05:07
epoch [44/50] batch [160/200] time 0.242 (0.243) data 0.000 (0.003) loss 1.0632 (1.7693) lr 2.7103e-04 eta 0:05:01
epoch [44/50] batch [180/200] time 0.243 (0.243) data 0.000 (0.003) loss 3.0174 (1.7717) lr 2.7103e-04 eta 0:04:56
epoch [44/50] batch [200/200] time 0.242 (0.243) data 0.000 (0.003) loss 1.1840 (1.7748) lr 2.2949e-04 eta 0:04:51
epoch [45/50] batch [20/200] time 0.235 (0.264) data 0.000 (0.025) loss 2.3277 (1.8597) lr 2.2949e-04 eta 0:05:11
epoch [45/50] batch [40/200] time 0.241 (0.252) data 0.000 (0.013) loss 1.4885 (1.7948) lr 2.2949e-04 eta 0:04:52
epoch [45/50] batch [60/200] time 0.237 (0.248) data 0.000 (0.009) loss 0.3741 (1.8382) lr 2.2949e-04 eta 0:04:42
epoch [45/50] batch [80/200] time 0.234 (0.246) data 0.000 (0.007) loss 1.4487 (1.7716) lr 2.2949e-04 eta 0:04:35
epoch [45/50] batch [100/200] time 0.240 (0.245) data 0.000 (0.005) loss 0.9388 (1.7369) lr 2.2949e-04 eta 0:04:28
epoch [45/50] batch [120/200] time 0.237 (0.244) data 0.000 (0.004) loss 2.0764 (1.7169) lr 2.2949e-04 eta 0:04:23
epoch [45/50] batch [140/200] time 0.241 (0.243) data 0.000 (0.004) loss 1.8364 (1.7533) lr 2.2949e-04 eta 0:04:17
epoch [45/50] batch [160/200] time 0.242 (0.243) data 0.000 (0.003) loss 1.6225 (1.7493) lr 2.2949e-04 eta 0:04:12
epoch [45/50] batch [180/200] time 0.237 (0.242) data 0.002 (0.003) loss 0.7342 (1.7699) lr 2.2949e-04 eta 0:04:07
epoch [45/50] batch [200/200] time 0.241 (0.242) data 0.000 (0.003) loss 1.9248 (1.7621) lr 1.9098e-04 eta 0:04:02
epoch [46/50] batch [20/200] time 0.241 (0.265) data 0.000 (0.025) loss 3.2836 (1.8333) lr 1.9098e-04 eta 0:04:19
epoch [46/50] batch [40/200] time 0.244 (0.252) data 0.000 (0.013) loss 1.8023 (1.8123) lr 1.9098e-04 eta 0:04:01
epoch [46/50] batch [60/200] time 0.237 (0.248) data 0.000 (0.008) loss 0.6552 (1.8129) lr 1.9098e-04 eta 0:03:53
epoch [46/50] batch [80/200] time 0.243 (0.246) data 0.000 (0.006) loss 2.3622 (1.7728) lr 1.9098e-04 eta 0:03:46
epoch [46/50] batch [100/200] time 0.239 (0.245) data 0.000 (0.005) loss 0.9787 (1.7325) lr 1.9098e-04 eta 0:03:40
epoch [46/50] batch [120/200] time 0.241 (0.244) data 0.000 (0.004) loss 1.6922 (1.7112) lr 1.9098e-04 eta 0:03:34
epoch [46/50] batch [140/200] time 0.243 (0.244) data 0.000 (0.004) loss 1.4489 (1.7441) lr 1.9098e-04 eta 0:03:29
epoch [46/50] batch [160/200] time 0.237 (0.243) data 0.000 (0.003) loss 1.3850 (1.7660) lr 1.9098e-04 eta 0:03:24
epoch [46/50] batch [180/200] time 0.239 (0.243) data 0.000 (0.003) loss 0.8530 (1.7625) lr 1.9098e-04 eta 0:03:19
epoch [46/50] batch [200/200] time 0.242 (0.242) data 0.000 (0.003) loss 1.0566 (1.7666) lr 1.5567e-04 eta 0:03:13
epoch [47/50] batch [20/200] time 0.242 (0.268) data 0.000 (0.028) loss 1.3466 (1.7488) lr 1.5567e-04 eta 0:03:29
epoch [47/50] batch [40/200] time 0.246 (0.255) data 0.000 (0.014) loss 1.8009 (1.7985) lr 1.5567e-04 eta 0:03:13
epoch [47/50] batch [60/200] time 0.243 (0.250) data 0.000 (0.009) loss 2.1361 (1.7501) lr 1.5567e-04 eta 0:03:04
epoch [47/50] batch [80/200] time 0.243 (0.248) data 0.000 (0.007) loss 2.5550 (1.7573) lr 1.5567e-04 eta 0:02:58
epoch [47/50] batch [100/200] time 0.236 (0.246) data 0.000 (0.006) loss 2.2333 (1.7289) lr 1.5567e-04 eta 0:02:52
epoch [47/50] batch [120/200] time 0.242 (0.245) data 0.000 (0.005) loss 1.9480 (1.7182) lr 1.5567e-04 eta 0:02:46
epoch [47/50] batch [140/200] time 0.234 (0.245) data 0.000 (0.004) loss 0.8321 (1.7202) lr 1.5567e-04 eta 0:02:41
epoch [47/50] batch [160/200] time 0.258 (0.244) data 0.000 (0.004) loss 3.0945 (1.7392) lr 1.5567e-04 eta 0:02:36
epoch [47/50] batch [180/200] time 0.239 (0.244) data 0.000 (0.003) loss 2.2732 (1.7159) lr 1.5567e-04 eta 0:02:31
epoch [47/50] batch [200/200] time 0.246 (0.243) data 0.000 (0.003) loss 2.4869 (1.7257) lr 1.2369e-04 eta 0:02:25
epoch [48/50] batch [20/200] time 0.242 (0.264) data 0.000 (0.025) loss 1.4806 (1.8357) lr 1.2369e-04 eta 0:02:33
epoch [48/50] batch [40/200] time 0.242 (0.252) data 0.000 (0.012) loss 1.4942 (1.8073) lr 1.2369e-04 eta 0:02:21
epoch [48/50] batch [60/200] time 0.241 (0.248) data 0.000 (0.008) loss 1.0452 (1.7211) lr 1.2369e-04 eta 0:02:13
epoch [48/50] batch [80/200] time 0.245 (0.246) data 0.000 (0.006) loss 2.1902 (1.7834) lr 1.2369e-04 eta 0:02:07
epoch [48/50] batch [100/200] time 0.243 (0.245) data 0.000 (0.005) loss 1.9526 (1.7743) lr 1.2369e-04 eta 0:02:02
epoch [48/50] batch [120/200] time 0.239 (0.244) data 0.000 (0.004) loss 1.2251 (1.7605) lr 1.2369e-04 eta 0:01:57
epoch [48/50] batch [140/200] time 0.242 (0.243) data 0.000 (0.004) loss 1.7170 (1.7591) lr 1.2369e-04 eta 0:01:51
epoch [48/50] batch [160/200] time 0.248 (0.243) data 0.011 (0.003) loss 2.3112 (1.7687) lr 1.2369e-04 eta 0:01:46
epoch [48/50] batch [180/200] time 0.236 (0.243) data 0.000 (0.003) loss 2.6287 (1.7738) lr 1.2369e-04 eta 0:01:42
epoch [48/50] batch [200/200] time 0.241 (0.243) data 0.000 (0.003) loss 1.4391 (1.7594) lr 9.5173e-05 eta 0:01:37
epoch [49/50] batch [20/200] time 0.240 (0.264) data 0.000 (0.025) loss 0.6945 (1.5895) lr 9.5173e-05 eta 0:01:40
epoch [49/50] batch [40/200] time 0.242 (0.252) data 0.000 (0.013) loss 2.0215 (1.7819) lr 9.5173e-05 eta 0:01:30
epoch [49/50] batch [60/200] time 0.241 (0.248) data 0.000 (0.008) loss 2.7988 (1.7600) lr 9.5173e-05 eta 0:01:24
epoch [49/50] batch [80/200] time 0.236 (0.246) data 0.000 (0.006) loss 1.9146 (1.7406) lr 9.5173e-05 eta 0:01:18
epoch [49/50] batch [100/200] time 0.236 (0.245) data 0.000 (0.005) loss 1.4613 (1.7444) lr 9.5173e-05 eta 0:01:13
epoch [49/50] batch [120/200] time 0.240 (0.244) data 0.000 (0.004) loss 1.6715 (1.7392) lr 9.5173e-05 eta 0:01:08
epoch [49/50] batch [140/200] time 0.243 (0.244) data 0.000 (0.004) loss 2.2460 (1.7451) lr 9.5173e-05 eta 0:01:03
epoch [49/50] batch [160/200] time 0.236 (0.243) data 0.000 (0.003) loss 1.2746 (1.7508) lr 9.5173e-05 eta 0:00:58
epoch [49/50] batch [180/200] time 0.240 (0.243) data 0.000 (0.003) loss 1.8940 (1.7377) lr 9.5173e-05 eta 0:00:53
epoch [49/50] batch [200/200] time 0.234 (0.243) data 0.000 (0.003) loss 1.4538 (1.7300) lr 7.0224e-05 eta 0:00:48
epoch [50/50] batch [20/200] time 0.242 (0.266) data 0.000 (0.025) loss 2.2822 (1.9853) lr 7.0224e-05 eta 0:00:47
epoch [50/50] batch [40/200] time 0.241 (0.253) data 0.000 (0.012) loss 1.7401 (1.7469) lr 7.0224e-05 eta 0:00:40
epoch [50/50] batch [60/200] time 0.242 (0.249) data 0.000 (0.008) loss 2.0091 (1.7775) lr 7.0224e-05 eta 0:00:34
epoch [50/50] batch [80/200] time 0.242 (0.247) data 0.000 (0.006) loss 1.5498 (1.7456) lr 7.0224e-05 eta 0:00:29
epoch [50/50] batch [100/200] time 0.242 (0.245) data 0.000 (0.005) loss 1.4594 (1.7298) lr 7.0224e-05 eta 0:00:24
epoch [50/50] batch [120/200] time 0.239 (0.245) data 0.000 (0.004) loss 1.4138 (1.7363) lr 7.0224e-05 eta 0:00:19
epoch [50/50] batch [140/200] time 0.236 (0.244) data 0.000 (0.004) loss 1.6181 (1.7486) lr 7.0224e-05 eta 0:00:14
epoch [50/50] batch [160/200] time 0.240 (0.244) data 0.000 (0.003) loss 1.6103 (1.7570) lr 7.0224e-05 eta 0:00:09
epoch [50/50] batch [180/200] time 0.257 (0.243) data 0.000 (0.003) loss 1.7493 (1.7729) lr 7.0224e-05 eta 0:00:04
epoch [50/50] batch [200/200] time 0.242 (0.243) data 0.000 (0.003) loss 3.0693 (1.7692) lr 4.8943e-05 eta 0:00:00
Checkpoint saved to output/base2new/train_base/fgvc_aircraft/vit_b16_ep50_c4_BZ4_ProDA/seed3/prompt_learner/model.pth.tar-50
Finish training
Deploy the last-epoch model
Evaluate on the *test* set
=> result
* total: 1,670
* correct: 867
* accuracy: 51.92%
* error: 48.08%
* macro_f1: 50.14%
Elapsed: 0:41:21
