2023-11-02 14:11:03   INFO  **********************Start logging**********************
2023-11-02 14:11:03   INFO  CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7
2023-11-02 14:11:03   INFO  cfg_file         cfgs/picture_models/picture_waymo_ssl_seal_decoder_mask_0.2.yaml
2023-11-02 14:11:03   INFO  batch_size       3
2023-11-02 14:11:03   INFO  epochs           30
2023-11-02 14:11:03   INFO  workers          4
2023-11-02 14:11:03   INFO  extra_tag        offline_30e
2023-11-02 14:11:03   INFO  ckpt             None
2023-11-02 14:11:03   INFO  pretrained_model None
2023-11-02 14:11:03   INFO  launcher         none
2023-11-02 14:11:03   INFO  tcp_port         18888
2023-11-02 14:11:03   INFO  sync_bn          False
2023-11-02 14:11:03   INFO  fix_random_seed  False
2023-11-02 14:11:03   INFO  ckpt_save_interval 1
2023-11-02 14:11:03   INFO  local_rank       0
2023-11-02 14:11:03   INFO  max_ckpt_save_num 1
2023-11-02 14:11:03   INFO  merge_all_iters_to_one_epoch False
2023-11-02 14:11:03   INFO  set_cfgs         None
2023-11-02 14:11:03   INFO  max_waiting_mins 0
2023-11-02 14:11:03   INFO  start_epoch      0
2023-11-02 14:11:03   INFO  num_epochs_to_eval 0
2023-11-02 14:11:03   INFO  save_to_file     False
2023-11-02 14:11:03   INFO  use_tqdm_to_record False
2023-11-02 14:11:03   INFO  logger_iter_interval 50
2023-11-02 14:11:03   INFO  ckpt_save_time_interval 300
2023-11-02 14:11:03   INFO  wo_gpu_stat      False
2023-11-02 14:11:03   INFO  fp16             False
2023-11-02 14:11:03   INFO  cfg.LOCAL_RANK: 0
2023-11-02 14:11:03   INFO  
cfg.DATA_CONFIG = edict()
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG.DATASET: WaymoDataset
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG.DATA_PATH: ../data/waymo
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG.PROCESSED_DATA_TAG: waymo_processed_data_v0_5_0
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG.POINT_CLOUD_RANGE: [-74.88, -74.88, -2, 74.88, 74.88, 4.0]
2023-11-02 14:11:03   INFO  
cfg.DATA_CONFIG.DATA_SPLIT = edict()
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG.DATA_SPLIT.train: train
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG.DATA_SPLIT.test: val
2023-11-02 14:11:03   INFO  
cfg.DATA_CONFIG.SAMPLED_INTERVAL = edict()
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG.SAMPLED_INTERVAL.train: 5
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG.SAMPLED_INTERVAL.test: 1
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG.FILTER_EMPTY_BOXES_FOR_TRAIN: True
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG.DISABLE_NLZ_FLAG_ON_POINTS: True
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG.USE_SHARED_MEMORY: False
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG.SHARED_MEMORY_FILE_LIMIT: 35000
2023-11-02 14:11:03   INFO  
cfg.DATA_CONFIG.DATA_AUGMENTOR = edict()
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG.DATA_AUGMENTOR.DISABLE_AUG_LIST: ['placeholder']
2023-11-02 14:11:03   INFO  
cfg.DATA_CONFIG.POINT_FEATURE_ENCODING = edict()
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG.POINT_FEATURE_ENCODING.encoding_type: absolute_coordinates_encoding
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG.POINT_FEATURE_ENCODING.used_feature_list: ['x', 'y', 'z', 'intensity', 'elongation']
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG.POINT_FEATURE_ENCODING.src_feature_list: ['x', 'y', 'z', 'intensity', 'elongation']
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG.DATA_PROCESSOR: [{'NAME': 'mask_points_and_boxes_outside_range', 'REMOVE_OUTSIDE_BOXES': True}, {'NAME': 'shuffle_points', 'SHUFFLE_ENABLED': {'train': True, 'test': False}}, {'NAME': 'transform_points_to_voxels_placeholder', 'VOXEL_SIZE': [0.32, 0.32, 6]}]
2023-11-02 14:11:03   INFO  cfg.DATA_CONFIG._BASE_CONFIG_: cfgs/dataset_configs/waymo_dataset.yaml
2023-11-02 14:11:03   INFO  
cfg.MODEL = edict()
2023-11-02 14:11:03   INFO  cfg.MODEL.NAME: PICTURE
2023-11-02 14:11:03   INFO  
cfg.MODEL.VFE = edict()
2023-11-02 14:11:03   INFO  cfg.MODEL.VFE.NAME: DynPillarVFE3D
2023-11-02 14:11:03   INFO  cfg.MODEL.VFE.WITH_DISTANCE: False
2023-11-02 14:11:03   INFO  cfg.MODEL.VFE.USE_ABSLOTE_XYZ: True
2023-11-02 14:11:03   INFO  cfg.MODEL.VFE.USE_NORM: True
2023-11-02 14:11:03   INFO  cfg.MODEL.VFE.NUM_FILTERS: [192, 192]
2023-11-02 14:11:03   INFO  
cfg.MODEL.BACKBONE_3D = edict()
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.NAME: DSVTBackboneMAE
2023-11-02 14:11:03   INFO  
cfg.MODEL.BACKBONE_3D.INPUT_LAYER = edict()
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.INPUT_LAYER.sparse_shape: [ 468, 468, 32 ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.INPUT_LAYER.downsample_stride: [ [ 1, 1, 4 ], [ 1, 1, 4 ], [ 1, 1, 2 ] ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.INPUT_LAYER.d_model: [ 192, 192, 192, 192 ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.INPUT_LAYER.set_info: [ [ 48, 1 ], [ 48, 1 ], [ 48, 1 ], [ 48, 1 ] ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.INPUT_LAYER.window_shape: [ [ 12, 12, 32 ], [ 12, 12, 8 ], [ 12, 12, 2 ], [ 12, 12, 1 ] ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.INPUT_LAYER.hybrid_factor: [2, 2, 1]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.INPUT_LAYER.shifts_list: [ [ [ 0, 0, 0 ], [ 6, 6, 0 ] ], [ [ 0, 0, 0 ], [ 6, 6, 0 ] ], [ [ 0, 0, 0 ], [ 6, 6, 0 ] ], [ [ 0, 0, 0 ], [ 6, 6, 0 ] ] ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.INPUT_LAYER.normalize_pos: False
2023-11-02 14:11:03   INFO  
cfg.MODEL.BACKBONE_3D.MASK_CONFIG = edict()
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.MASK_CONFIG.n_clusters: 8
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.MASK_CONFIG.n_partition: [3, 3, 2]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.MASK_CONFIG.lambda_threshold: 0.6
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.MASK_CONFIG.base_mask_ratio: [0.9, 0.45, 0]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.MASK_CONFIG.NUM_SEAL_FEATURES: 64
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.MASK_CONFIG.GENERATE_MODE: offline
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.block_name: [ 'DSVTBlock','DSVTBlock','DSVTBlock','DSVTBlock' ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.set_info: [ [ 48, 1 ], [ 48, 1 ], [ 48, 1 ], [ 48, 1 ] ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.d_model: [ 192, 192, 192, 192 ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.nhead: [ 8, 8, 8, 8 ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.dim_feedforward: [ 384, 384, 384, 384 ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.dropout: 0.0
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.activation: gelu
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.output_shape: [468, 468]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.conv_out_channel: 192
2023-11-02 14:11:03   INFO  
cfg.MODEL.BACKBONE_2D = edict()
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_2D.NAME: LightDecoder
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_2D.INPUT_LAYER.sparse_shape: [ 468, 468, 32 ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_2D.INPUT_LAYER.downsample_stride: [ [ 1, 1, 4 ], [ 1, 1, 4 ], [ 1, 1, 2 ] ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_2D.INPUT_LAYER.d_model: [ 192, 192 ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_2D.INPUT_LAYER.set_info: [ [ 48, 1 ], [ 48, 1 ]]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_2D.INPUT_LAYER.window_shape: [ [ 12, 12, 32 ], [ 12, 12, 1 ] ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_2D.INPUT_LAYER.hybrid_factor: [ 2, 2, 1 ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_2D.INPUT_LAYER.shifts_list: [ [ [ 0, 0, 0 ], [ 6, 6, 0 ] ], [ [ 0, 0, 0 ], [ 6, 6, 0 ] ] ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_2D.INPUT_LAYER.shifts_list: normalize_pos: False
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_2D.INPUT_SHAPE: [ 468, 468, 32 ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_2D.NUM_BEV_FEATURES: 192
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.block_name: [ 'DSVTBlock','DSVTBlock' ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.set_info: [ [ 48, 1 ], [ 48, 1 ] ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.d_model: [ 192, 192 ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.nhead: [ 8, 8 ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.dim_feedforward: [ 384, 384 ]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.dropout: 0.0
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.activation: gelu
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.output_shape: [468, 468]
2023-11-02 14:11:03   INFO  cfg.MODEL.BACKBONE_3D.conv_out_channel: 192
2023-11-02 14:11:03   INFO  
cfg.MODEL.DENSE_HEAD = edict()
2023-11-02 14:11:03   INFO  cfg.MODEL.DENSE_HEAD.NAME: PretrainHead3D
2023-11-02 14:11:03   INFO  cfg.MODEL.DENSE_HEAD.CLASS_AGNOSTIC: False
2023-11-02 14:11:03   INFO  
cfg.MODEL.DENSE_HEAD.MASK_CONFIG = edict()
2023-11-02 14:11:03   INFO  cfg.MODEL.DENSE_HEAD.MASK_CONFIG.NUM_PRD_POINTS: 16
2023-11-02 14:11:03   INFO  cfg.MODEL.DENSE_HEAD.MASK_CONFIG.NUM_GT_POINTS: 64
2023-11-02 14:11:03   INFO  cfg.MODEL.DENSE_HEAD.INPUT_SHAPE: [468, 468, 32]
2023-11-02 14:11:03   INFO  cfg.MODEL.DENSE_HEAD.NUM_MINK_FEATURES: 64
2023-11-02 14:11:03   INFO  cfg.MODEL.DENSE_HEAD.LOSS_WEIGHT: [1.0, 3.0]
2023-11-02 14:11:03   INFO  cfg.MODEL.DENSE_HEAD.GENERATE_MODE: offline
2023-11-02 14:11:03   INFO  
cfg.MODEL.POST_PROCESSING = edict()
2023-11-02 14:11:03   INFO  cfg.MODEL.POST_PROCESSING: None
2023-11-02 14:11:03   INFO  
cfg.OPTIMIZATION = edict()
2023-11-02 14:11:03   INFO  cfg.OPTIMIZATION.BATCH_SIZE_PER_GPU: 3
2023-11-02 14:11:03   INFO  cfg.OPTIMIZATION.NUM_EPOCHS: 30
2023-11-02 14:11:03   INFO  cfg.OPTIMIZATION.OPTIMIZER: adamw
2023-11-02 14:11:03   INFO  cfg.OPTIMIZATION.LR: 0.001
2023-11-02 14:11:03   INFO  cfg.OPTIMIZATION.WEIGHT_DECAY: 0.05
2023-11-02 14:11:03   INFO  cfg.OPTIMIZATION.MOMENTUM: 0.9
2023-11-02 14:11:03   INFO  cfg.OPTIMIZATION.MOMS: [0.95, 0.85]
2023-11-02 14:11:03   INFO  cfg.OPTIMIZATION.PCT_START: 0.1
2023-11-02 14:11:03   INFO  cfg.OPTIMIZATION.DIV_FACTOR: 100
2023-11-02 14:11:03   INFO  cfg.OPTIMIZATION.DECAY_STEP_LIST: [35, 45]
2023-11-02 14:11:03   INFO  cfg.OPTIMIZATION.LR_DECAY: 0.1
2023-11-02 14:11:03   INFO  cfg.OPTIMIZATION.LR_CLIP: 1e-07
2023-11-02 14:11:03   INFO  cfg.OPTIMIZATION.LR_WARMUP: False
2023-11-02 14:11:03   INFO  cfg.OPTIMIZATION.WARMUP_EPOCH: 1
2023-11-02 14:11:03   INFO  cfg.OPTIMIZATION.GRAD_NORM_CLIP: 10
2023-11-02 14:11:03   INFO  cfg.TAG: picture_waymo_ssl_seal_decoder_mask_0.2
2023-11-02 14:11:03   INFO  cfg.EXP_GROUP_PATH: picture_models
2023-11-02 14:11:03   INFO  Loading Waymo dataset
2023-11-02 14:11:09   INFO  Total skipped info 0
2023-11-02 14:11:09   INFO  Total samples for Waymo dataset: 158081
2023-11-02 14:11:09   INFO  Total sampled samples for Waymo dataset: 31617
2023-11-02 14:11:12   INFO  PICTURE(
  (vfe): DynamicPillarVFE_3d(
    (pfn_layers): ModuleList(
      (0): PFNLayerV2(
        (linear): Linear(in_features=11, out_features=64, bias=False)
        (norm): BatchNorm1d(64, eps=0.001, momentum=0.01, affine=True, track_running_stats=True)
        (relu): ReLU()
      )
      (1): PFNLayerV2(
        (linear): Linear(in_features=192, out_features=192, bias=False)
        (norm): BatchNorm1d(192, eps=0.001, momentum=0.01, affine=True, track_running_stats=True)
        (relu): ReLU()
      )
    )
  )
  (backbone_3d): DSVTBackboneMAE(
    (input_layer): DSVTInputLayer(
      (posembed_layers): ModuleList(
        (0): ModuleList(
          (0): ModuleList(
            (0): PositionEmbeddingLearned(
              (position_embedding_head): Sequential(
                (0): Linear(in_features=2, out_features=192, bias=True)
                (1): BatchNorm1d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
                (2): ReLU(inplace=True)
                (3): Linear(in_features=192, out_features=192, bias=True)
              )
            )
            (1): PositionEmbeddingLearned(
              (position_embedding_head): Sequential(
                (0): Linear(in_features=2, out_features=192, bias=True)
                (1): BatchNorm1d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
                (2): ReLU(inplace=True)
                (3): Linear(in_features=192, out_features=192, bias=True)
              )
            )
          )
          (1): ModuleList(
            (0): PositionEmbeddingLearned(
              (position_embedding_head): Sequential(
                (0): Linear(in_features=2, out_features=192, bias=True)
                (1): BatchNorm1d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
                (2): ReLU(inplace=True)
                (3): Linear(in_features=192, out_features=192, bias=True)
              )
            )
            (1): PositionEmbeddingLearned(
              (position_embedding_head): Sequential(
                (0): Linear(in_features=2, out_features=192, bias=True)
                (1): BatchNorm1d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
                (2): ReLU(inplace=True)
                (3): Linear(in_features=192, out_features=192, bias=True)
              )
            )
          )
          (2): ModuleList(
            (0): PositionEmbeddingLearned(
              (position_embedding_head): Sequential(
                (0): Linear(in_features=2, out_features=192, bias=True)
                (1): BatchNorm1d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
                (2): ReLU(inplace=True)
                (3): Linear(in_features=192, out_features=192, bias=True)
              )
            )
            (1): PositionEmbeddingLearned(
              (position_embedding_head): Sequential(
                (0): Linear(in_features=2, out_features=192, bias=True)
                (1): BatchNorm1d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
                (2): ReLU(inplace=True)
                (3): Linear(in_features=192, out_features=192, bias=True)
              )
            )
          )
          (3): ModuleList(
            (0): PositionEmbeddingLearned(
              (position_embedding_head): Sequential(
                (0): Linear(in_features=2, out_features=192, bias=True)
                (1): BatchNorm1d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
                (2): ReLU(inplace=True)
                (3): Linear(in_features=192, out_features=192, bias=True)
              )
            )
            (1): PositionEmbeddingLearned(
              (position_embedding_head): Sequential(
                (0): Linear(in_features=2, out_features=192, bias=True)
                (1): BatchNorm1d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
                (2): ReLU(inplace=True)
                (3): Linear(in_features=192, out_features=192, bias=True)
              )
            )
          )
        )
      )
    )
    (stage_0): ModuleList(
      (0): DSVTBlock(
        (encoder_list): ModuleList(
          (0): DSVT_EncoderLayer(
            (win_attn): SetAttention(
              (self_attn): MultiheadAttention(
                (out_proj): NonDynamicallyQuantizableLinear(in_features=192, out_features=192, bias=True)
              )
              (linear1): Linear(in_features=192, out_features=384, bias=True)
              (dropout): Dropout(p=0, inplace=False)
              (linear2): Linear(in_features=384, out_features=192, bias=True)
              (norm1): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (norm2): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (dropout1): Identity()
              (dropout2): Identity()
            )
            (norm): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
          )
          (1): DSVT_EncoderLayer(
            (win_attn): SetAttention(
              (self_attn): MultiheadAttention(
                (out_proj): NonDynamicallyQuantizableLinear(in_features=192, out_features=192, bias=True)
              )
              (linear1): Linear(in_features=192, out_features=384, bias=True)
              (dropout): Dropout(p=0, inplace=False)
              (linear2): Linear(in_features=384, out_features=192, bias=True)
              (norm1): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (norm2): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (dropout1): Identity()
              (dropout2): Identity()
            )
            (norm): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
          )
        )
      )
      (1): DSVTBlock(
        (encoder_list): ModuleList(
          (0): DSVT_EncoderLayer(
            (win_attn): SetAttention(
              (self_attn): MultiheadAttention(
                (out_proj): NonDynamicallyQuantizableLinear(in_features=192, out_features=192, bias=True)
              )
              (linear1): Linear(in_features=192, out_features=384, bias=True)
              (dropout): Dropout(p=0, inplace=False)
              (linear2): Linear(in_features=384, out_features=192, bias=True)
              (norm1): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (norm2): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (dropout1): Identity()
              (dropout2): Identity()
            )
            (norm): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
          )
          (1): DSVT_EncoderLayer(
            (win_attn): SetAttention(
              (self_attn): MultiheadAttention(
                (out_proj): NonDynamicallyQuantizableLinear(in_features=192, out_features=192, bias=True)
              )
              (linear1): Linear(in_features=192, out_features=384, bias=True)
              (dropout): Dropout(p=0, inplace=False)
              (linear2): Linear(in_features=384, out_features=192, bias=True)
              (norm1): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (norm2): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (dropout1): Identity()
              (dropout2): Identity()
            )
            (norm): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
          )
        )
      )
      (2): DSVTBlock(
        (encoder_list): ModuleList(
          (0): DSVT_EncoderLayer(
            (win_attn): SetAttention(
              (self_attn): MultiheadAttention(
                (out_proj): NonDynamicallyQuantizableLinear(in_features=192, out_features=192, bias=True)
              )
              (linear1): Linear(in_features=192, out_features=384, bias=True)
              (dropout): Dropout(p=0, inplace=False)
              (linear2): Linear(in_features=384, out_features=192, bias=True)
              (norm1): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (norm2): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (dropout1): Identity()
              (dropout2): Identity()
            )
            (norm): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
          )
          (1): DSVT_EncoderLayer(
            (win_attn): SetAttention(
              (self_attn): MultiheadAttention(
                (out_proj): NonDynamicallyQuantizableLinear(in_features=192, out_features=192, bias=True)
              )
              (linear1): Linear(in_features=192, out_features=384, bias=True)
              (dropout): Dropout(p=0, inplace=False)
              (linear2): Linear(in_features=384, out_features=192, bias=True)
              (norm1): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (norm2): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (dropout1): Identity()
              (dropout2): Identity()
            )
            (norm): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
          )
        )
      )
      (3): DSVTBlock(
        (encoder_list): ModuleList(
          (0): DSVT_EncoderLayer(
            (win_attn): SetAttention(
              (self_attn): MultiheadAttention(
                (out_proj): NonDynamicallyQuantizableLinear(in_features=192, out_features=192, bias=True)
              )
              (linear1): Linear(in_features=192, out_features=384, bias=True)
              (dropout): Dropout(p=0, inplace=False)
              (linear2): Linear(in_features=384, out_features=192, bias=True)
              (norm1): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (norm2): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (dropout1): Identity()
              (dropout2): Identity()
            )
            (norm): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
          )
          (1): DSVT_EncoderLayer(
            (win_attn): SetAttention(
              (self_attn): MultiheadAttention(
                (out_proj): NonDynamicallyQuantizableLinear(in_features=192, out_features=192, bias=True)
              )
              (linear1): Linear(in_features=192, out_features=384, bias=True)
              (dropout): Dropout(p=0, inplace=False)
              (linear2): Linear(in_features=384, out_features=192, bias=True)
              (norm1): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (norm2): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (dropout1): Identity()
              (dropout2): Identity()
            )
            (norm): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
          )
        )
      )
    )
    (residual_norm_stage_0): ModuleList(
      (0): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
      (1): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
      (2): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
      (3): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
    )
  )
  (map_to_bev_module): None
  (pfe): None
  (backbone_2d): LightDecoder(
    (input_layer): DSVTInputLayer(
      (posembed_layers): ModuleList(
        (0): ModuleList(
          (0): ModuleList(
            (0): PositionEmbeddingLearned(
              (position_embedding_head): Sequential(
                (0): Linear(in_features=2, out_features=192, bias=True)
                (1): BatchNorm1d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
                (2): ReLU(inplace=True)
                (3): Linear(in_features=192, out_features=192, bias=True)
              )
            )
            (1): PositionEmbeddingLearned(
              (position_embedding_head): Sequential(
                (0): Linear(in_features=2, out_features=192, bias=True)
                (1): BatchNorm1d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
                (2): ReLU(inplace=True)
                (3): Linear(in_features=192, out_features=192, bias=True)
              )
            )
          )
          (1): ModuleList(
            (0): PositionEmbeddingLearned(
              (position_embedding_head): Sequential(
                (0): Linear(in_features=2, out_features=192, bias=True)
                (1): BatchNorm1d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
                (2): ReLU(inplace=True)
                (3): Linear(in_features=192, out_features=192, bias=True)
              )
            )
            (1): PositionEmbeddingLearned(
              (position_embedding_head): Sequential(
                (0): Linear(in_features=2, out_features=192, bias=True)
                (1): BatchNorm1d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
                (2): ReLU(inplace=True)
                (3): Linear(in_features=192, out_features=192, bias=True)
              )
            )
          )
        )
      )
    )
    (stage_0): ModuleList(
      (0): DSVTBlock(
        (encoder_list): ModuleList(
          (0): DSVT_EncoderLayer(
            (win_attn): SetAttention(
              (self_attn): MultiheadAttention(
                (out_proj): NonDynamicallyQuantizableLinear(in_features=192, out_features=192, bias=True)
              )
              (linear1): Linear(in_features=192, out_features=384, bias=True)
              (dropout): Dropout(p=0, inplace=False)
              (linear2): Linear(in_features=384, out_features=192, bias=True)
              (norm1): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (norm2): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (dropout1): Identity()
              (dropout2): Identity()
            )
            (norm): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
          )
          (1): DSVT_EncoderLayer(
            (win_attn): SetAttention(
              (self_attn): MultiheadAttention(
                (out_proj): NonDynamicallyQuantizableLinear(in_features=192, out_features=192, bias=True)
              )
              (linear1): Linear(in_features=192, out_features=384, bias=True)
              (dropout): Dropout(p=0, inplace=False)
              (linear2): Linear(in_features=384, out_features=192, bias=True)
              (norm1): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (norm2): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (dropout1): Identity()
              (dropout2): Identity()
            )
            (norm): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
          )
        )
      )
      (1): DSVTBlock(
        (encoder_list): ModuleList(
          (0): DSVT_EncoderLayer(
            (win_attn): SetAttention(
              (self_attn): MultiheadAttention(
                (out_proj): NonDynamicallyQuantizableLinear(in_features=192, out_features=192, bias=True)
              )
              (linear1): Linear(in_features=192, out_features=384, bias=True)
              (dropout): Dropout(p=0, inplace=False)
              (linear2): Linear(in_features=384, out_features=192, bias=True)
              (norm1): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (norm2): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (dropout1): Identity()
              (dropout2): Identity()
            )
            (norm): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
          )
          (1): DSVT_EncoderLayer(
            (win_attn): SetAttention(
              (self_attn): MultiheadAttention(
                (out_proj): NonDynamicallyQuantizableLinear(in_features=192, out_features=192, bias=True)
              )
              (linear1): Linear(in_features=192, out_features=384, bias=True)
              (dropout): Dropout(p=0, inplace=False)
              (linear2): Linear(in_features=384, out_features=192, bias=True)
              (norm1): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (norm2): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
              (dropout1): Identity()
              (dropout2): Identity()
            )
            (norm): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
          )
        )
      )
    )
    (residual_norm_stage_0): ModuleList(
      (0): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
      (1): LayerNorm((192,), eps=1e-05, elementwise_affine=True)
    )
  )
  (dense_head): PretrainHead3D(
    (decoder_pred): Linear(in_features=192, out_features=48, bias=True)
    (decoder_seal): Linear(in_features=192, out_features=64, bias=True)
    (seal_loss): SmoothL1Loss()
  )
  (point_head): None
  (roi_head): None
)
2023-11-02 14:11:12   INFO  Total number of parameters: 6514608
2023-11-02 14:11:12   INFO  **********************Start training picture_models/picture_waymo_ssl_seal_decoder_mask_0.2(offline_30e)**********************
2023-11-02 14:12:55   INFO  epoch: 0/30, acc_iter=50, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:21:18, time_cost(all): 0:00:50/10:48:31, loss=3.474518624050178, d_time=0.00(0.00), f_time=1.12(1.01), b_time=1.16(1.03), norm=3.64311324209034, lr=1.5690440060698e-05
2023-11-02 14:13:45   INFO  epoch: 0/30, acc_iter=100, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:20:15, time_cost(all): 0:01:40/11:22:23, loss=3.3232281701528, d_time=0.00(0.00), f_time=1.12(1.01), b_time=1.14(1.03), norm=4.299809432530008, lr=2.1380880121396e-05
2023-11-02 14:14:35   INFO  epoch: 0/30, acc_iter=150, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:19:14, time_cost(all): 0:02:30/11:05:49, loss=3.171937716255422, d_time=0.00(0.00), f_time=1.11(1.01), b_time=1.1(1.03), norm=1.9027316744454468, lr=2.7071320182094e-05
2023-11-02 14:15:26   INFO  epoch: 0/30, acc_iter=200, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:18:33, time_cost(all): 0:03:21/10:47:13, loss=3.020647262358044, d_time=0.00(0.00), f_time=1.03(1.01), b_time=1.01(1.03), norm=3.5069585548361353, lr=3.2761760242792e-05
2023-11-02 14:16:16   INFO  epoch: 0/30, acc_iter=250, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:29, time_cost(all): 0:04:11/11:08:53, loss=2.869356808460667, d_time=0.00(0.00), f_time=1.11(1.01), b_time=0.95(1.03), norm=4.501940365915973, lr=3.845220030349e-05
2023-11-02 14:17:06   INFO  epoch: 0/30, acc_iter=300, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:16:50, time_cost(all): 0:05:01/10:58:56, loss=2.718066354563289, d_time=0.00(0.00), f_time=1.04(1.01), b_time=1.03(1.03), norm=1.1295138555038147, lr=4.4142640364188e-05
2023-11-02 14:17:57   INFO  epoch: 0/30, acc_iter=350, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:32, time_cost(all): 0:05:52/11:20:54, loss=2.566775900665911, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.19(1.03), norm=4.342894761449664, lr=4.9833080424886e-05
2023-11-02 14:18:47   INFO  epoch: 0/30, acc_iter=400, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:14:44, time_cost(all): 0:06:42/11:27:11, loss=2.415485446768534, d_time=0.00(0.00), f_time=0.93(1.01), b_time=1.07(1.03), norm=0.5358569513374347, lr=5.5523520485584e-05
2023-11-02 14:19:37   INFO  epoch: 0/30, acc_iter=450, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:40, time_cost(all): 0:07:32/10:41:34, loss=2.264194992871156, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.21(1.03), norm=0.7149994552132879, lr=6.1213960546282e-05
2023-11-02 14:20:28   INFO  epoch: 0/30, acc_iter=500, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:14:22, time_cost(all): 0:08:23/10:36:20, loss=2.112904538973778, d_time=0.00(0.00), f_time=0.94(1.01), b_time=1.05(1.03), norm=1.622809031992501, lr=6.690440060698e-05
2023-11-02 14:21:18   INFO  epoch: 0/30, acc_iter=550, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:13:17, time_cost(all): 0:09:13/10:52:03, loss=1.9616140850764, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.04(1.03), norm=2.810598578900278, lr=7.2594840667678e-05
2023-11-02 14:22:08   INFO  epoch: 0/30, acc_iter=600, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:03, time_cost(all): 0:10:03/10:59:13, loss=1.810323631179023, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.19(1.03), norm=3.925195716893989, lr=7.8285280728376e-05
2023-11-02 14:22:59   INFO  epoch: 0/30, acc_iter=650, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:10:54, time_cost(all): 0:10:54/10:43:14, loss=1.659033177281644, d_time=0.00(0.00), f_time=1.1(1.01), b_time=1.08(1.03), norm=1.8209725088163795, lr=8.3975720789074e-05
2023-11-02 14:23:49   INFO  epoch: 0/30, acc_iter=700, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:43, time_cost(all): 0:11:44/10:21:42, loss=1.507742723384267, d_time=0.00(0.00), f_time=1.01(1.01), b_time=0.88(1.03), norm=3.426161853771672, lr=8.9666160849772e-05
2023-11-02 14:24:39   INFO  epoch: 0/30, acc_iter=750, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:49, time_cost(all): 0:12:34/10:55:55, loss=1.356452269486889, d_time=0.00(0.00), f_time=0.96(1.01), b_time=0.9(1.03), norm=1.166690945210581, lr=9.535660091047e-05
2023-11-02 14:25:30   INFO  epoch: 0/30, acc_iter=800, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:28, time_cost(all): 0:13:25/10:55:26, loss=1.205161815589511, d_time=0.00(0.00), f_time=1.07(1.01), b_time=1.13(1.03), norm=1.2487077814219236, lr=0.000102617602427921
2023-11-02 14:26:20   INFO  epoch: 0/30, acc_iter=850, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:08:01, time_cost(all): 0:14:15/11:13:44, loss=1.053871361692134, d_time=0.00(0.00), f_time=1.1(1.01), b_time=1.13(1.03), norm=1.7547211961392166, lr=0.000116843702579666
2023-11-02 14:27:10   INFO  epoch: 0/30, acc_iter=900, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:17, time_cost(all): 0:15:05/10:17:34, loss=0.902580907794756, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.99(1.03), norm=0.9486329595478526, lr=0.000131069802731411
2023-11-02 14:28:01   INFO  epoch: 0/30, acc_iter=950, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:28, time_cost(all): 0:15:56/10:47:45, loss=0.751290453897378, d_time=0.00(0.00), f_time=1.09(1.01), b_time=1.14(1.03), norm=2.0777603576369095, lr=0.000145295902883156
2023-11-02 14:28:51   INFO  epoch: 0/30, acc_iter=1000, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:24, time_cost(all): 0:16:46/11:13:37, loss=0.61518114683672, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.14(1.03), norm=3.718484956672714, lr=0.000159522003034901
2023-11-02 14:29:41   INFO  epoch: 0/30, acc_iter=1050, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:37, time_cost(all): 0:17:36/10:52:57, loss=0.599577321447318, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.01(1.03), norm=4.124624199807763, lr=0.000173748103186646
2023-11-02 14:30:32   INFO  epoch: 0/30, acc_iter=1100, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:41, time_cost(all): 0:18:27/10:14:51, loss=0.599154642894635, d_time=0.00(0.00), f_time=1.01(1.01), b_time=0.89(1.03), norm=1.3149116033379653, lr=0.000187974203338391
2023-11-02 14:31:22   INFO  epoch: 0/30, acc_iter=1150, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:46, time_cost(all): 0:19:17/10:48:22, loss=0.598731964341953, d_time=0.00(0.00), f_time=0.96(1.01), b_time=0.96(1.03), norm=4.965342698806254, lr=0.000202200303490137
2023-11-02 14:32:12   INFO  epoch: 0/30, acc_iter=1200, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:02:04, time_cost(all): 0:20:07/10:15:37, loss=0.598309285789271, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.05(1.03), norm=4.181351058167614, lr=0.000216426403641882
2023-11-02 14:33:03   INFO  epoch: 0/30, acc_iter=1250, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:11, time_cost(all): 0:20:58/10:37:49, loss=0.597886607236588, d_time=0.00(0.00), f_time=1.12(1.01), b_time=0.97(1.03), norm=2.6758275167153975, lr=0.000230652503793627
2023-11-02 14:33:53   INFO  epoch: 0/30, acc_iter=1300, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:17, time_cost(all): 0:21:48/10:20:01, loss=0.597463928683906, d_time=0.00(0.00), f_time=1.01(1.01), b_time=1.06(1.03), norm=4.615609320404059, lr=0.000244878603945372
2023-11-02 14:34:43   INFO  epoch: 1/30, acc_iter=1368, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:20:34, time_cost(all): 0:22:38/10:45:22, loss=0.596889085852258, d_time=0.00(0.00), f_time=0.96(1.01), b_time=1.2(1.03), norm=2.0033836311745956, lr=0.000264226100151745
2023-11-02 14:35:34   INFO  epoch: 1/30, acc_iter=1418, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:19:43, time_cost(all): 0:23:29/10:09:01, loss=0.596466407299576, d_time=0.00(0.00), f_time=1.06(1.01), b_time=0.93(1.03), norm=2.9817093425272145, lr=0.00027845220030349
2023-11-02 14:36:24   INFO  epoch: 1/30, acc_iter=1468, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:18:40, time_cost(all): 0:24:19/10:41:50, loss=0.596043728746894, d_time=0.00(0.00), f_time=1.18(1.01), b_time=1.1(1.03), norm=4.948233728445498, lr=0.000292678300455235
2023-11-02 14:37:14   INFO  epoch: 1/30, acc_iter=1518, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:18:13, time_cost(all): 0:25:09/10:32:47, loss=0.595621050194211, d_time=0.00(0.00), f_time=1.15(1.01), b_time=1.15(1.03), norm=2.449458640220869, lr=0.00030690440060698
2023-11-02 14:38:05   INFO  epoch: 1/30, acc_iter=1568, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:49, time_cost(all): 0:26:00/10:40:37, loss=0.595198371641529, d_time=0.00(0.00), f_time=0.98(1.01), b_time=0.93(1.03), norm=3.17630516266659, lr=0.000321130500758725
2023-11-02 14:38:55   INFO  epoch: 1/30, acc_iter=1618, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:17:07, time_cost(all): 0:26:50/10:49:37, loss=0.594775693088847, d_time=0.00(0.00), f_time=1.05(1.01), b_time=0.87(1.03), norm=3.0625523614430867, lr=0.00033535660091047
2023-11-02 14:39:45   INFO  epoch: 1/30, acc_iter=1668, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:15:42, time_cost(all): 0:27:40/10:55:15, loss=0.594353014536164, d_time=0.00(0.00), f_time=1.03(1.01), b_time=1.01(1.03), norm=3.268648945759925, lr=0.000349582701062215
2023-11-02 14:40:36   INFO  epoch: 1/30, acc_iter=1718, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:55, time_cost(all): 0:28:31/10:37:17, loss=0.593930335983482, d_time=0.00(0.00), f_time=0.96(1.01), b_time=1.06(1.03), norm=4.931262669061594, lr=0.00036380880121396
2023-11-02 14:41:26   INFO  epoch: 1/30, acc_iter=1768, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:13:52, time_cost(all): 0:29:21/10:15:00, loss=0.5935076574308, d_time=0.00(0.00), f_time=1.04(1.01), b_time=0.96(1.03), norm=2.2074175313193116, lr=0.000378034901365706
2023-11-02 14:42:16   INFO  epoch: 1/30, acc_iter=1818, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:20, time_cost(all): 0:30:11/10:49:37, loss=0.593084978878118, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.2(1.03), norm=3.219674667194139, lr=0.000392261001517451
2023-11-02 14:43:07   INFO  epoch: 1/30, acc_iter=1868, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:16, time_cost(all): 0:31:02/10:36:37, loss=0.592662300325435, d_time=0.00(0.00), f_time=0.95(1.01), b_time=1.18(1.03), norm=3.7520298961289034, lr=0.000406487101669196
2023-11-02 14:43:57   INFO  epoch: 1/30, acc_iter=1918, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:11:42, time_cost(all): 0:31:52/10:56:00, loss=0.592239621772753, d_time=0.00(0.00), f_time=0.97(1.01), b_time=0.96(1.03), norm=3.2328764018566165, lr=0.000420713201820941
2023-11-02 14:44:47   INFO  epoch: 1/30, acc_iter=1968, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:11, time_cost(all): 0:32:42/10:16:18, loss=0.591816943220071, d_time=0.00(0.00), f_time=1.1(1.01), b_time=0.98(1.03), norm=1.5426964235506913, lr=0.000434939301972686
2023-11-02 14:45:38   INFO  epoch: 1/30, acc_iter=2018, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:46, time_cost(all): 0:33:33/10:32:13, loss=0.591394264667388, d_time=0.00(0.00), f_time=0.94(1.01), b_time=0.91(1.03), norm=0.9447100472705148, lr=0.000449165402124431
2023-11-02 14:46:28   INFO  epoch: 1/30, acc_iter=2068, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:57, time_cost(all): 0:34:23/10:53:38, loss=0.590971586114706, d_time=0.00(0.00), f_time=1.0(1.01), b_time=1.2(1.03), norm=1.1930272287652282, lr=0.000463391502276176
2023-11-02 14:47:18   INFO  epoch: 1/30, acc_iter=2118, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:25, time_cost(all): 0:35:13/10:01:10, loss=0.590548907562024, d_time=0.00(0.00), f_time=0.98(1.01), b_time=0.91(1.03), norm=2.136819918725502, lr=0.000477617602427921
2023-11-02 14:48:09   INFO  epoch: 1/30, acc_iter=2168, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:08:00, time_cost(all): 0:36:04/10:55:48, loss=0.590126229009341, d_time=0.00(0.00), f_time=0.98(1.01), b_time=1.06(1.03), norm=0.5596533614978502, lr=0.000491843702579666
2023-11-02 14:48:59   INFO  epoch: 1/30, acc_iter=2218, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:21, time_cost(all): 0:36:54/10:34:23, loss=0.589703550456659, d_time=0.00(0.00), f_time=0.95(1.01), b_time=1.12(1.03), norm=2.375701189438377, lr=0.000506069802731411
2023-11-02 14:49:49   INFO  epoch: 1/30, acc_iter=2268, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:22, time_cost(all): 0:37:44/9:59:41, loss=0.589280871903977, d_time=0.00(0.00), f_time=1.0(1.01), b_time=0.83(1.03), norm=2.1577991160557533, lr=0.000520295902883156
2023-11-02 14:50:40   INFO  epoch: 1/30, acc_iter=2318, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:06, time_cost(all): 0:38:35/10:28:55, loss=0.588858193351295, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.22(1.03), norm=1.3316585863360269, lr=0.000534522003034901
2023-11-02 14:51:30   INFO  epoch: 1/30, acc_iter=2368, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:22, time_cost(all): 0:39:25/10:37:14, loss=0.588435514798612, d_time=0.00(0.00), f_time=1.04(1.01), b_time=0.86(1.03), norm=3.1144801538128717, lr=0.000548748103186646
2023-11-02 14:52:20   INFO  epoch: 1/30, acc_iter=2418, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:40, time_cost(all): 0:40:15/10:04:06, loss=0.58801283624593, d_time=0.00(0.00), f_time=1.03(1.01), b_time=1.08(1.03), norm=0.7419643815900216, lr=0.000562974203338392
2023-11-02 14:53:11   INFO  epoch: 1/30, acc_iter=2468, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:55, time_cost(all): 0:41:06/10:36:38, loss=0.587590157693248, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.05(1.03), norm=0.7372618268277611, lr=0.000577200303490137
2023-11-02 14:54:01   INFO  epoch: 1/30, acc_iter=2518, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:56, time_cost(all): 0:41:56/10:16:26, loss=0.587167479140565, d_time=0.00(0.00), f_time=1.07(1.01), b_time=0.89(1.03), norm=4.072073958719293, lr=0.000591426403641882
2023-11-02 14:54:51   INFO  epoch: 1/30, acc_iter=2568, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:06, time_cost(all): 0:42:46/10:21:28, loss=0.586744800587883, d_time=0.00(0.00), f_time=0.96(1.01), b_time=1.09(1.03), norm=3.0932866640194914, lr=0.000605652503793627
2023-11-02 14:55:42   INFO  epoch: 1/30, acc_iter=2618, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:18, time_cost(all): 0:43:37/10:03:14, loss=0.586322122035201, d_time=0.00(0.00), f_time=1.18(1.01), b_time=1.19(1.03), norm=0.7186612730027808, lr=0.000619878603945372
2023-11-02 14:56:32   INFO  epoch: 2/30, acc_iter=2686, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:21:59, time_cost(all): 0:44:27/9:52:29, loss=0.585747279203553, d_time=0.00(0.00), f_time=0.97(1.01), b_time=0.94(1.03), norm=3.7950252853211603, lr=0.000639226100151745
2023-11-02 14:57:22   INFO  epoch: 2/30, acc_iter=2736, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:20:12, time_cost(all): 0:45:17/10:22:56, loss=0.58532460065087, d_time=0.00(0.00), f_time=1.08(1.01), b_time=0.99(1.03), norm=2.091459441424565, lr=0.00065345220030349
2023-11-02 14:58:13   INFO  epoch: 2/30, acc_iter=2786, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:19:59, time_cost(all): 0:46:08/10:04:55, loss=0.584901922098188, d_time=0.00(0.00), f_time=1.1(1.01), b_time=1.02(1.03), norm=3.7273075944904575, lr=0.000667678300455235
2023-11-02 14:59:03   INFO  epoch: 2/30, acc_iter=2836, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:19:28, time_cost(all): 0:46:58/10:12:57, loss=0.584479243545506, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.13(1.03), norm=0.7967589488159914, lr=0.00068190440060698
2023-11-02 14:59:53   INFO  epoch: 2/30, acc_iter=2886, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:07, time_cost(all): 0:47:48/10:39:36, loss=0.584056564992824, d_time=0.00(0.00), f_time=1.04(1.01), b_time=0.99(1.03), norm=2.265498558689618, lr=0.000696130500758725
2023-11-02 15:00:44   INFO  epoch: 2/30, acc_iter=2936, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:16:42, time_cost(all): 0:48:39/10:33:28, loss=0.583633886440141, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.1(1.03), norm=2.0385341052569297, lr=0.00071035660091047
2023-11-02 15:01:34   INFO  epoch: 2/30, acc_iter=2986, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:18, time_cost(all): 0:49:29/10:06:17, loss=0.583211207887459, d_time=0.00(0.00), f_time=1.1(1.01), b_time=1.21(1.03), norm=4.100345789026372, lr=0.000724582701062215
2023-11-02 15:02:24   INFO  epoch: 2/30, acc_iter=3036, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:18, time_cost(all): 0:50:19/10:18:52, loss=0.582788529334777, d_time=0.00(0.00), f_time=1.16(1.01), b_time=1.0(1.03), norm=1.4834829306550503, lr=0.00073880880121396
2023-11-02 15:03:15   INFO  epoch: 2/30, acc_iter=3086, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:58, time_cost(all): 0:51:10/10:24:42, loss=0.582365850782094, d_time=0.00(0.00), f_time=1.18(1.01), b_time=1.1(1.03), norm=2.2306036818310235, lr=0.000753034901365706
2023-11-02 15:04:05   INFO  epoch: 2/30, acc_iter=3136, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:13, time_cost(all): 0:52:00/9:41:16, loss=0.581943172229412, d_time=0.00(0.00), f_time=1.2(1.01), b_time=0.89(1.03), norm=4.248615345343586, lr=0.000767261001517451
2023-11-02 15:04:55   INFO  epoch: 2/30, acc_iter=3186, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:13:29, time_cost(all): 0:52:50/10:02:40, loss=0.58152049367673, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.15(1.03), norm=1.233179446787303, lr=0.000781487101669196
2023-11-02 15:05:46   INFO  epoch: 2/30, acc_iter=3236, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:11:35, time_cost(all): 0:53:41/10:20:42, loss=0.581097815124047, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.13(1.03), norm=3.4075257031124058, lr=0.000795713201820941
2023-11-02 15:06:36   INFO  epoch: 2/30, acc_iter=3286, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:39, time_cost(all): 0:54:31/9:59:02, loss=0.580675136571365, d_time=0.00(0.00), f_time=1.08(1.01), b_time=0.98(1.03), norm=3.9213876275369124, lr=0.000809939301972686
2023-11-02 15:07:26   INFO  epoch: 2/30, acc_iter=3336, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:32, time_cost(all): 0:55:21/10:19:29, loss=0.580252458018683, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.21(1.03), norm=0.7033918908254447, lr=0.000824165402124431
2023-11-02 15:08:17   INFO  epoch: 2/30, acc_iter=3386, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:21, time_cost(all): 0:56:12/10:22:59, loss=0.579829779466, d_time=0.00(0.00), f_time=0.92(1.01), b_time=0.84(1.03), norm=4.556690570115882, lr=0.000838391502276176
2023-11-02 15:09:07   INFO  epoch: 2/30, acc_iter=3436, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:19, time_cost(all): 0:57:02/9:48:14, loss=0.579407100913318, d_time=0.00(0.00), f_time=1.09(1.01), b_time=1.09(1.03), norm=2.7821172622271155, lr=0.000852617602427921
2023-11-02 15:09:57   INFO  epoch: 2/30, acc_iter=3486, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:54, time_cost(all): 0:57:52/10:05:57, loss=0.578984422360636, d_time=0.00(0.00), f_time=0.92(1.01), b_time=1.14(1.03), norm=1.0478674457873303, lr=0.000866843702579666
2023-11-02 15:10:48   INFO  epoch: 2/30, acc_iter=3536, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:14, time_cost(all): 0:58:43/10:00:10, loss=0.578561743807954, d_time=0.00(0.00), f_time=0.94(1.01), b_time=1.16(1.03), norm=3.1459831464949883, lr=0.000881069802731411
2023-11-02 15:11:38   INFO  epoch: 2/30, acc_iter=3586, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:16, time_cost(all): 0:59:33/10:07:47, loss=0.578139065255271, d_time=0.00(0.00), f_time=1.01(1.01), b_time=1.22(1.03), norm=2.6501038457856665, lr=0.000895295902883156
2023-11-02 15:12:28   INFO  epoch: 2/30, acc_iter=3636, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:22, time_cost(all): 1:00:23/10:28:25, loss=0.577716386702589, d_time=0.00(0.00), f_time=1.15(1.01), b_time=1.0(1.03), norm=4.476238252782907, lr=0.000909522003034901
2023-11-02 15:13:19   INFO  epoch: 2/30, acc_iter=3686, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:18, time_cost(all): 1:01:14/10:15:01, loss=0.577293708149907, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.94(1.03), norm=0.8031562275367459, lr=0.000923748103186646
2023-11-02 15:14:09   INFO  epoch: 2/30, acc_iter=3736, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:37, time_cost(all): 1:02:04/9:50:03, loss=0.576871029597224, d_time=0.00(0.00), f_time=0.96(1.01), b_time=0.96(1.03), norm=3.658141857299702, lr=0.000937974203338391
2023-11-02 15:14:59   INFO  epoch: 2/30, acc_iter=3786, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:55, time_cost(all): 1:02:54/9:39:05, loss=0.576448351044542, d_time=0.00(0.00), f_time=0.93(1.01), b_time=1.14(1.03), norm=3.9742484210540043, lr=0.000952200303490137
2023-11-02 15:15:50   INFO  epoch: 2/30, acc_iter=3836, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:52, time_cost(all): 1:03:45/9:48:53, loss=0.57602567249186, d_time=0.00(0.00), f_time=0.95(1.01), b_time=0.9(1.03), norm=3.261816633911703, lr=0.000966426403641882
2023-11-02 15:16:40   INFO  epoch: 2/30, acc_iter=3886, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:07, time_cost(all): 1:04:35/9:31:06, loss=0.575602993939177, d_time=0.00(0.00), f_time=1.14(1.01), b_time=0.83(1.03), norm=4.317006575691448, lr=0.000980652503793627
2023-11-02 15:17:30   INFO  epoch: 2/30, acc_iter=3936, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:18, time_cost(all): 1:05:25/9:33:35, loss=0.575180315386495, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.13(1.03), norm=1.0224202031243954, lr=0.000994878603945372
2023-11-02 15:18:21   INFO  epoch: 3/30, acc_iter=4004, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:22:01, time_cost(all): 1:06:16/9:28:09, loss=0.574605472554847, d_time=0.00(0.00), f_time=1.15(1.01), b_time=0.92(1.03), norm=4.6432858557543, lr=0.000998397059137832
2023-11-02 15:19:11   INFO  epoch: 3/30, acc_iter=4054, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:21:07, time_cost(all): 1:07:06/9:54:07, loss=0.574182794002165, d_time=0.00(0.00), f_time=1.04(1.01), b_time=0.85(1.03), norm=1.4821537636089543, lr=0.000996794118275663
2023-11-02 15:20:01   INFO  epoch: 3/30, acc_iter=4104, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:20:22, time_cost(all): 1:07:56/9:55:17, loss=0.573760115449483, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.01(1.03), norm=2.903665839572912, lr=0.000995191177413495
2023-11-02 15:20:52   INFO  epoch: 3/30, acc_iter=4154, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:19:02, time_cost(all): 1:08:47/10:12:22, loss=0.5733374368968, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.21(1.03), norm=3.0297426290586875, lr=0.000993588236551326
2023-11-02 15:21:42   INFO  epoch: 3/30, acc_iter=4204, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:17, time_cost(all): 1:09:37/9:54:07, loss=0.572914758344118, d_time=0.00(0.00), f_time=0.98(1.01), b_time=1.01(1.03), norm=3.617759691170706, lr=0.000991985295689158
2023-11-02 15:22:32   INFO  epoch: 3/30, acc_iter=4254, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:16:14, time_cost(all): 1:10:27/9:51:46, loss=0.572492079791436, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.92(1.03), norm=1.6547280010173075, lr=0.000990382354826989
2023-11-02 15:23:23   INFO  epoch: 3/30, acc_iter=4304, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:15:40, time_cost(all): 1:11:18/10:17:39, loss=0.572069401238753, d_time=0.00(0.00), f_time=0.93(1.01), b_time=1.05(1.03), norm=1.705005237196623, lr=0.000988779413964821
2023-11-02 15:24:13   INFO  epoch: 3/30, acc_iter=4354, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:14:41, time_cost(all): 1:12:08/9:38:05, loss=0.571646722686071, d_time=0.00(0.00), f_time=1.18(1.01), b_time=1.14(1.03), norm=1.453904991175662, lr=0.000987176473102652
2023-11-02 15:25:03   INFO  epoch: 3/30, acc_iter=4404, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:54, time_cost(all): 1:12:58/10:13:47, loss=0.571224044133389, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.06(1.03), norm=4.3139757612308784, lr=0.000985573532240484
2023-11-02 15:25:54   INFO  epoch: 3/30, acc_iter=4454, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:14:13, time_cost(all): 1:13:49/9:53:48, loss=0.570801365580706, d_time=0.00(0.00), f_time=0.92(1.01), b_time=0.91(1.03), norm=0.6516905261292667, lr=0.000983970591378315
2023-11-02 15:26:44   INFO  epoch: 3/30, acc_iter=4504, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:24, time_cost(all): 1:14:39/9:19:41, loss=0.570378687028024, d_time=0.00(0.00), f_time=1.1(1.01), b_time=1.07(1.03), norm=2.7508742840871436, lr=0.000982367650516147
2023-11-02 15:27:34   INFO  epoch: 3/30, acc_iter=4554, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:00, time_cost(all): 1:15:29/10:15:37, loss=0.569956008475342, d_time=0.00(0.00), f_time=0.99(1.01), b_time=0.98(1.03), norm=2.8447554545900653, lr=0.000980764709653978
2023-11-02 15:28:25   INFO  epoch: 3/30, acc_iter=4604, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:43, time_cost(all): 1:16:20/10:09:14, loss=0.56953332992266, d_time=0.00(0.00), f_time=1.07(1.01), b_time=1.01(1.03), norm=4.653992904139874, lr=0.00097916176879181
2023-11-02 15:29:15   INFO  epoch: 3/30, acc_iter=4654, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:27, time_cost(all): 1:17:10/10:10:30, loss=0.569110651369977, d_time=0.00(0.00), f_time=1.11(1.01), b_time=0.85(1.03), norm=1.3579166646551066, lr=0.000977558827929642
2023-11-02 15:30:05   INFO  epoch: 3/30, acc_iter=4704, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:46, time_cost(all): 1:18:00/9:48:00, loss=0.568687972817295, d_time=0.00(0.00), f_time=0.98(1.01), b_time=0.91(1.03), norm=3.649757440974894, lr=0.000975955887067473
2023-11-02 15:30:56   INFO  epoch: 3/30, acc_iter=4754, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:34, time_cost(all): 1:18:51/10:05:44, loss=0.568265294264613, d_time=0.00(0.00), f_time=0.98(1.01), b_time=1.04(1.03), norm=4.100689423075929, lr=0.000974352946205305
2023-11-02 15:31:46   INFO  epoch: 3/30, acc_iter=4804, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:08:07, time_cost(all): 1:19:41/10:03:06, loss=0.56784261571193, d_time=0.00(0.00), f_time=0.93(1.01), b_time=0.93(1.03), norm=2.6944701434282816, lr=0.000972750005343136
2023-11-02 15:32:36   INFO  epoch: 3/30, acc_iter=4854, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:10, time_cost(all): 1:20:31/9:34:27, loss=0.567419937159248, d_time=0.00(0.00), f_time=1.15(1.01), b_time=1.03(1.03), norm=3.3113250335019204, lr=0.000971147064480968
2023-11-02 15:33:27   INFO  epoch: 3/30, acc_iter=4904, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:22, time_cost(all): 1:21:22/9:27:04, loss=0.566997258606566, d_time=0.00(0.00), f_time=1.2(1.01), b_time=0.84(1.03), norm=1.2910139147842015, lr=0.000969544123618799
2023-11-02 15:34:17   INFO  epoch: 3/30, acc_iter=4954, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:14, time_cost(all): 1:22:12/9:22:39, loss=0.566574580053884, d_time=0.00(0.00), f_time=0.96(1.01), b_time=1.08(1.03), norm=1.3337740650842262, lr=0.000967941182756631
2023-11-02 15:35:07   INFO  epoch: 3/30, acc_iter=5004, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:21, time_cost(all): 1:23:02/9:48:19, loss=0.566151901501201, d_time=0.00(0.00), f_time=1.04(1.01), b_time=1.22(1.03), norm=0.6041450539837638, lr=0.000966338241894462
2023-11-02 15:35:58   INFO  epoch: 3/30, acc_iter=5054, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:47, time_cost(all): 1:23:53/10:05:29, loss=0.565729222948519, d_time=0.00(0.00), f_time=1.2(1.01), b_time=1.14(1.03), norm=1.706803936628035, lr=0.000964735301032294
2023-11-02 15:36:48   INFO  epoch: 3/30, acc_iter=5104, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:42, time_cost(all): 1:24:43/9:46:14, loss=0.565306544395837, d_time=0.00(0.00), f_time=1.12(1.01), b_time=1.03(1.03), norm=4.904250287005155, lr=0.000963132360170126
2023-11-02 15:37:38   INFO  epoch: 3/30, acc_iter=5154, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:55, time_cost(all): 1:25:33/9:59:57, loss=0.564883865843154, d_time=0.00(0.00), f_time=1.18(1.01), b_time=0.88(1.03), norm=3.7901310128974863, lr=0.000961529419307957
2023-11-02 15:38:29   INFO  epoch: 3/30, acc_iter=5204, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:05, time_cost(all): 1:26:24/9:56:06, loss=0.564461187290472, d_time=0.00(0.00), f_time=1.17(1.01), b_time=0.89(1.03), norm=3.1630616372957956, lr=0.000959926478445789
2023-11-02 15:39:19   INFO  epoch: 3/30, acc_iter=5254, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:17, time_cost(all): 1:27:14/9:42:06, loss=0.56403850873779, d_time=0.00(0.00), f_time=1.18(1.01), b_time=1.12(1.03), norm=3.436537223439437, lr=0.00095832353758362
2023-11-02 15:40:09   INFO  epoch: 4/30, acc_iter=5322, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:21:19, time_cost(all): 1:28:04/9:38:13, loss=0.563463665906142, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.03(1.03), norm=1.2713284043243327, lr=0.000956143538011071
2023-11-02 15:41:00   INFO  epoch: 4/30, acc_iter=5372, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:20:30, time_cost(all): 1:28:55/9:06:28, loss=0.563040987353459, d_time=0.00(0.00), f_time=1.16(1.01), b_time=1.2(1.03), norm=3.4229884892545344, lr=0.000954540597148903
2023-11-02 15:41:50   INFO  epoch: 4/30, acc_iter=5422, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:19:34, time_cost(all): 1:29:45/9:32:14, loss=0.562618308800777, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.22(1.03), norm=4.976157785790867, lr=0.000952937656286734
2023-11-02 15:42:40   INFO  epoch: 4/30, acc_iter=5472, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:18:21, time_cost(all): 1:30:35/9:17:29, loss=0.562195630248095, d_time=0.00(0.00), f_time=1.01(1.01), b_time=0.87(1.03), norm=4.086706278490755, lr=0.000951334715424566
2023-11-02 15:43:31   INFO  epoch: 4/30, acc_iter=5522, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:20, time_cost(all): 1:31:26/9:15:58, loss=0.561772951695413, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.11(1.03), norm=2.223419464824585, lr=0.000949731774562397
2023-11-02 15:44:21   INFO  epoch: 4/30, acc_iter=5572, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:17:40, time_cost(all): 1:32:16/9:19:51, loss=0.56135027314273, d_time=0.00(0.00), f_time=1.0(1.01), b_time=1.04(1.03), norm=3.1518573940556776, lr=0.000948128833700229
2023-11-02 15:45:11   INFO  epoch: 4/30, acc_iter=5622, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:44, time_cost(all): 1:33:06/9:42:15, loss=0.560927594590048, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.06(1.03), norm=2.867566218076186, lr=0.00094652589283806
2023-11-02 15:46:02   INFO  epoch: 4/30, acc_iter=5672, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:14:49, time_cost(all): 1:33:57/9:05:59, loss=0.560504916037366, d_time=0.00(0.00), f_time=1.1(1.01), b_time=1.16(1.03), norm=3.5855880789031764, lr=0.000944922951975892
2023-11-02 15:46:52   INFO  epoch: 4/30, acc_iter=5722, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:15:06, time_cost(all): 1:34:47/9:56:01, loss=0.560082237484683, d_time=0.00(0.00), f_time=1.13(1.01), b_time=0.95(1.03), norm=2.212264323772592, lr=0.000943320011113723
2023-11-02 15:47:42   INFO  epoch: 4/30, acc_iter=5772, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:18, time_cost(all): 1:35:37/9:19:06, loss=0.559659558932001, d_time=0.00(0.00), f_time=0.92(1.01), b_time=1.04(1.03), norm=2.572590656486167, lr=0.000941717070251555
2023-11-02 15:48:33   INFO  epoch: 4/30, acc_iter=5822, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:13:21, time_cost(all): 1:36:28/9:55:05, loss=0.559236880379319, d_time=0.00(0.00), f_time=1.04(1.01), b_time=0.88(1.03), norm=1.4788809245555572, lr=0.000940114129389386
2023-11-02 15:49:23   INFO  epoch: 4/30, acc_iter=5872, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:26, time_cost(all): 1:37:18/9:28:28, loss=0.558814201826636, d_time=0.00(0.00), f_time=0.93(1.01), b_time=1.17(1.03), norm=4.095209704526857, lr=0.000938511188527218
2023-11-02 15:50:13   INFO  epoch: 4/30, acc_iter=5922, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:28, time_cost(all): 1:38:08/9:41:03, loss=0.558391523273954, d_time=0.00(0.00), f_time=1.19(1.01), b_time=0.9(1.03), norm=0.9798103853951512, lr=0.000936908247665049
2023-11-02 15:51:04   INFO  epoch: 4/30, acc_iter=5972, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:23, time_cost(all): 1:38:59/9:41:35, loss=0.557968844721272, d_time=0.00(0.00), f_time=1.05(1.01), b_time=0.94(1.03), norm=2.9287473392319407, lr=0.000935305306802881
2023-11-02 15:51:54   INFO  epoch: 4/30, acc_iter=6022, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:27, time_cost(all): 1:39:49/9:04:42, loss=0.55754616616859, d_time=0.00(0.00), f_time=0.99(1.01), b_time=0.88(1.03), norm=2.9747462606654227, lr=0.000933702365940713
2023-11-02 15:52:44   INFO  epoch: 4/30, acc_iter=6072, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:57, time_cost(all): 1:40:39/8:57:31, loss=0.557123487615907, d_time=0.00(0.00), f_time=0.92(1.01), b_time=0.85(1.03), norm=2.2578025812201483, lr=0.000932099425078544
2023-11-02 15:53:35   INFO  epoch: 4/30, acc_iter=6122, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:51, time_cost(all): 1:41:30/8:55:35, loss=0.556700809063225, d_time=0.00(0.00), f_time=1.18(1.01), b_time=0.86(1.03), norm=4.1916169102269585, lr=0.000930496484216376
2023-11-02 15:54:25   INFO  epoch: 4/30, acc_iter=6172, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:06:48, time_cost(all): 1:42:20/9:30:33, loss=0.556278130510543, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.85(1.03), norm=0.8230473043230999, lr=0.000928893543354207
2023-11-02 15:55:15   INFO  epoch: 4/30, acc_iter=6222, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:28, time_cost(all): 1:43:10/9:42:18, loss=0.55585545195786, d_time=0.00(0.00), f_time=1.1(1.01), b_time=1.03(1.03), norm=3.202342490472587, lr=0.000927290602492039
2023-11-02 15:56:06   INFO  epoch: 4/30, acc_iter=6272, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:14, time_cost(all): 1:44:01/8:52:19, loss=0.555432773405178, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.11(1.03), norm=3.0933489187699093, lr=0.00092568766162987
2023-11-02 15:56:56   INFO  epoch: 4/30, acc_iter=6322, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:34, time_cost(all): 1:44:51/9:24:40, loss=0.555010094852496, d_time=0.00(0.00), f_time=1.06(1.01), b_time=0.98(1.03), norm=4.998342198477728, lr=0.000924084720767702
2023-11-02 15:57:46   INFO  epoch: 4/30, acc_iter=6372, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:44, time_cost(all): 1:45:41/9:29:00, loss=0.554587416299813, d_time=0.00(0.00), f_time=1.12(1.01), b_time=1.22(1.03), norm=1.1307136305666026, lr=0.000922481779905533
2023-11-02 15:58:37   INFO  epoch: 4/30, acc_iter=6422, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:43, time_cost(all): 1:46:32/9:23:34, loss=0.554164737747131, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.2(1.03), norm=2.0082229323216643, lr=0.000920878839043365
2023-11-02 15:59:27   INFO  epoch: 4/30, acc_iter=6472, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:02:02, time_cost(all): 1:47:22/8:51:28, loss=0.553742059194449, d_time=0.00(0.00), f_time=0.96(1.01), b_time=1.05(1.03), norm=0.8530890466885372, lr=0.000919275898181197
2023-11-02 16:00:17   INFO  epoch: 4/30, acc_iter=6522, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:07, time_cost(all): 1:48:12/8:57:28, loss=0.553319380641766, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.2(1.03), norm=4.617744803677721, lr=0.000917672957319028
2023-11-02 16:01:08   INFO  epoch: 4/30, acc_iter=6572, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:17, time_cost(all): 1:49:03/9:05:03, loss=0.552896702089084, d_time=0.00(0.00), f_time=1.14(1.01), b_time=0.93(1.03), norm=3.8581617646914395, lr=0.00091607001645686
2023-11-02 16:01:58   INFO  epoch: 5/30, acc_iter=6640, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:21:15, time_cost(all): 1:49:53/9:19:29, loss=0.552321859257436, d_time=0.00(0.00), f_time=1.01(1.01), b_time=1.04(1.03), norm=0.6777274751261848, lr=0.00091389001688431
2023-11-02 16:02:48   INFO  epoch: 5/30, acc_iter=6690, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:20:45, time_cost(all): 1:50:43/9:16:01, loss=0.551899180704754, d_time=0.00(0.00), f_time=1.0(1.01), b_time=1.1(1.03), norm=0.5594989145557312, lr=0.000912287076022142
2023-11-02 16:03:39   INFO  epoch: 5/30, acc_iter=6740, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:18:58, time_cost(all): 1:51:34/8:52:44, loss=0.551476502152072, d_time=0.00(0.00), f_time=0.98(1.01), b_time=1.02(1.03), norm=4.844676104568094, lr=0.000910684135159974
2023-11-02 16:04:29   INFO  epoch: 5/30, acc_iter=6790, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:17:53, time_cost(all): 1:52:24/9:09:45, loss=0.551053823599389, d_time=0.00(0.00), f_time=1.11(1.01), b_time=1.14(1.03), norm=2.3265197776208586, lr=0.000909081194297805
2023-11-02 16:05:19   INFO  epoch: 5/30, acc_iter=6840, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:18:37, time_cost(all): 1:53:14/8:45:49, loss=0.550631145046707, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.14(1.03), norm=0.5845172455286871, lr=0.000907478253435637
2023-11-02 16:06:10   INFO  epoch: 5/30, acc_iter=6890, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:17:03, time_cost(all): 1:54:05/9:28:46, loss=0.550208466494025, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.15(1.03), norm=2.9788833155858216, lr=0.000905875312573468
2023-11-02 16:07:00   INFO  epoch: 5/30, acc_iter=6940, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:10, time_cost(all): 1:54:55/9:11:54, loss=0.549785787941342, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.85(1.03), norm=4.871945621177579, lr=0.0009042723717113
2023-11-02 16:07:50   INFO  epoch: 5/30, acc_iter=6990, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:57, time_cost(all): 1:55:45/8:49:59, loss=0.54936310938866, d_time=0.00(0.00), f_time=1.04(1.01), b_time=1.15(1.03), norm=3.4214847534374604, lr=0.000902669430849131
2023-11-02 16:08:41   INFO  epoch: 5/30, acc_iter=7040, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:20, time_cost(all): 1:56:36/8:42:33, loss=0.548940430835978, d_time=0.00(0.00), f_time=1.12(1.01), b_time=1.0(1.03), norm=3.579576145649748, lr=0.000901066489986963
2023-11-02 16:09:31   INFO  epoch: 5/30, acc_iter=7090, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:41, time_cost(all): 1:57:26/9:01:16, loss=0.548517752283295, d_time=0.00(0.00), f_time=0.92(1.01), b_time=0.91(1.03), norm=4.146739869438251, lr=0.000899463549124794
2023-11-02 16:10:21   INFO  epoch: 5/30, acc_iter=7140, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:20, time_cost(all): 1:58:16/8:56:46, loss=0.548095073730613, d_time=0.00(0.00), f_time=1.11(1.01), b_time=0.93(1.03), norm=1.6802948204890074, lr=0.000897860608262626
2023-11-02 16:11:12   INFO  epoch: 5/30, acc_iter=7190, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:11:35, time_cost(all): 1:59:07/8:55:52, loss=0.547672395177931, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.01(1.03), norm=3.3268684210083115, lr=0.000896257667400457
2023-11-02 16:12:02   INFO  epoch: 5/30, acc_iter=7240, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:11, time_cost(all): 1:59:57/8:42:35, loss=0.547249716625249, d_time=0.00(0.00), f_time=1.15(1.01), b_time=1.16(1.03), norm=0.856156504004511, lr=0.000894654726538289
2023-11-02 16:12:52   INFO  epoch: 5/30, acc_iter=7290, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:33, time_cost(all): 2:00:47/9:18:42, loss=0.546827038072566, d_time=0.00(0.00), f_time=1.19(1.01), b_time=0.84(1.03), norm=4.129331659738552, lr=0.00089305178567612
2023-11-02 16:13:43   INFO  epoch: 5/30, acc_iter=7340, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:38, time_cost(all): 2:01:38/9:15:20, loss=0.546404359519884, d_time=0.00(0.00), f_time=0.94(1.01), b_time=0.86(1.03), norm=0.5077739095974623, lr=0.000891448844813952
2023-11-02 16:14:33   INFO  epoch: 5/30, acc_iter=7390, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:17, time_cost(all): 2:02:28/8:53:38, loss=0.545981680967202, d_time=0.00(0.00), f_time=1.11(1.01), b_time=1.09(1.03), norm=0.8265912465070084, lr=0.000889845903951784
2023-11-02 16:15:23   INFO  epoch: 5/30, acc_iter=7440, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:34, time_cost(all): 2:03:18/9:04:45, loss=0.545559002414519, d_time=0.00(0.00), f_time=1.16(1.01), b_time=1.08(1.03), norm=2.0286874287279466, lr=0.000888242963089615
2023-11-02 16:16:14   INFO  epoch: 5/30, acc_iter=7490, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:06:59, time_cost(all): 2:04:09/8:57:14, loss=0.545136323861837, d_time=0.00(0.00), f_time=1.16(1.01), b_time=1.08(1.03), norm=2.8705303180924338, lr=0.000886640022227447
2023-11-02 16:17:04   INFO  epoch: 5/30, acc_iter=7540, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:04, time_cost(all): 2:04:59/9:01:53, loss=0.544713645309155, d_time=0.00(0.00), f_time=0.93(1.01), b_time=1.09(1.03), norm=3.918385312990217, lr=0.000885037081365278
2023-11-02 16:17:54   INFO  epoch: 5/30, acc_iter=7590, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:33, time_cost(all): 2:05:49/9:01:17, loss=0.544290966756472, d_time=0.00(0.00), f_time=0.98(1.01), b_time=1.11(1.03), norm=2.215581097999524, lr=0.00088343414050311
2023-11-02 16:18:45   INFO  epoch: 5/30, acc_iter=7640, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:42, time_cost(all): 2:06:40/8:37:07, loss=0.54386828820379, d_time=0.00(0.00), f_time=1.08(1.01), b_time=0.98(1.03), norm=3.14798559579547, lr=0.000881831199640941
2023-11-02 16:19:35   INFO  epoch: 5/30, acc_iter=7690, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:35, time_cost(all): 2:07:30/8:53:19, loss=0.543445609651108, d_time=0.00(0.00), f_time=0.92(1.01), b_time=1.22(1.03), norm=2.4103381079518194, lr=0.000880228258778773
2023-11-02 16:20:25   INFO  epoch: 5/30, acc_iter=7740, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:47, time_cost(all): 2:08:20/8:56:51, loss=0.543022931098426, d_time=0.00(0.00), f_time=1.09(1.01), b_time=1.07(1.03), norm=2.203964412846492, lr=0.000878625317916604
2023-11-02 16:21:16   INFO  epoch: 5/30, acc_iter=7790, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:54, time_cost(all): 2:09:11/9:05:44, loss=0.542600252545743, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.05(1.03), norm=1.1859354468040306, lr=0.000877022377054436
2023-11-02 16:22:06   INFO  epoch: 5/30, acc_iter=7840, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:07, time_cost(all): 2:10:01/8:27:58, loss=0.542177573993061, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.08(1.03), norm=4.551556027845868, lr=0.000875419436192267
2023-11-02 16:22:56   INFO  epoch: 5/30, acc_iter=7890, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:18, time_cost(all): 2:10:51/9:15:54, loss=0.541754895440379, d_time=0.00(0.00), f_time=1.1(1.01), b_time=1.15(1.03), norm=2.503183086334766, lr=0.000873816495330099
2023-11-02 16:23:47   INFO  epoch: 6/30, acc_iter=7958, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:21:01, time_cost(all): 2:11:42/8:43:16, loss=0.541180052608731, d_time=0.00(0.00), f_time=0.97(1.01), b_time=0.93(1.03), norm=2.465430823290539, lr=0.00087163649575755
2023-11-02 16:24:37   INFO  epoch: 6/30, acc_iter=8008, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:19:46, time_cost(all): 2:12:32/8:51:40, loss=0.540757374056048, d_time=0.00(0.00), f_time=0.96(1.01), b_time=0.9(1.03), norm=1.4328786694336113, lr=0.000870033554895381
2023-11-02 16:25:27   INFO  epoch: 6/30, acc_iter=8058, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:20:22, time_cost(all): 2:13:22/8:49:52, loss=0.540334695503366, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.16(1.03), norm=3.2608750452567734, lr=0.000868430614033213
2023-11-02 16:26:18   INFO  epoch: 6/30, acc_iter=8108, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:18:53, time_cost(all): 2:14:13/8:58:09, loss=0.539912016950684, d_time=0.00(0.00), f_time=1.13(1.01), b_time=0.86(1.03), norm=4.553282170827968, lr=0.000866827673171045
2023-11-02 16:27:08   INFO  epoch: 6/30, acc_iter=8158, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:18:15, time_cost(all): 2:15:03/8:30:19, loss=0.539489338398002, d_time=0.00(0.00), f_time=1.18(1.01), b_time=0.95(1.03), norm=3.2174422076050453, lr=0.000865224732308876
2023-11-02 16:27:58   INFO  epoch: 6/30, acc_iter=8208, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:17:45, time_cost(all): 2:15:53/8:35:32, loss=0.539066659845319, d_time=0.00(0.00), f_time=1.06(1.01), b_time=0.95(1.03), norm=4.258707012611273, lr=0.000863621791446708
2023-11-02 16:28:49   INFO  epoch: 6/30, acc_iter=8258, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:49, time_cost(all): 2:16:44/8:24:10, loss=0.538643981292637, d_time=0.00(0.00), f_time=1.0(1.01), b_time=1.02(1.03), norm=4.887172630627512, lr=0.000862018850584539
2023-11-02 16:29:39   INFO  epoch: 6/30, acc_iter=8308, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:22, time_cost(all): 2:17:34/8:37:22, loss=0.538221302739955, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.18(1.03), norm=2.1276033037678728, lr=0.000860415909722371
2023-11-02 16:30:29   INFO  epoch: 6/30, acc_iter=8358, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:12, time_cost(all): 2:18:24/8:37:29, loss=0.537798624187272, d_time=0.00(0.00), f_time=0.93(1.01), b_time=1.05(1.03), norm=2.780320753279673, lr=0.000858812968860202
2023-11-02 16:31:19   INFO  epoch: 6/30, acc_iter=8408, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:20, time_cost(all): 2:19:14/8:29:00, loss=0.53737594563459, d_time=0.00(0.00), f_time=1.1(1.01), b_time=1.09(1.03), norm=2.8433487333499596, lr=0.000857210027998034
2023-11-02 16:32:10   INFO  epoch: 6/30, acc_iter=8458, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:13:30, time_cost(all): 2:20:05/8:39:20, loss=0.536953267081908, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.9(1.03), norm=3.518083719747158, lr=0.000855607087135865
2023-11-02 16:33:00   INFO  epoch: 6/30, acc_iter=8508, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:03, time_cost(all): 2:20:55/8:59:42, loss=0.536530588529225, d_time=0.00(0.00), f_time=1.06(1.01), b_time=0.87(1.03), norm=3.2051713160896744, lr=0.000854004146273697
2023-11-02 16:33:50   INFO  epoch: 6/30, acc_iter=8558, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:11, time_cost(all): 2:21:45/8:57:17, loss=0.536107909976543, d_time=0.00(0.00), f_time=1.18(1.01), b_time=1.18(1.03), norm=4.469418589053795, lr=0.000852401205411528
2023-11-02 16:34:41   INFO  epoch: 6/30, acc_iter=8608, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:14, time_cost(all): 2:22:36/9:04:04, loss=0.535685231423861, d_time=0.00(0.00), f_time=0.91(1.01), b_time=0.9(1.03), norm=2.5529939407405795, lr=0.00085079826454936
2023-11-02 16:35:31   INFO  epoch: 6/30, acc_iter=8658, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:57, time_cost(all): 2:23:26/8:26:22, loss=0.535262552871179, d_time=0.00(0.00), f_time=0.93(1.01), b_time=1.11(1.03), norm=1.8795088050371112, lr=0.000849195323687191
2023-11-02 16:36:21   INFO  epoch: 6/30, acc_iter=8708, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:39, time_cost(all): 2:24:16/8:16:27, loss=0.534839874318496, d_time=0.00(0.00), f_time=1.07(1.01), b_time=0.93(1.03), norm=0.8173821020721942, lr=0.000847592382825023
2023-11-02 16:37:12   INFO  epoch: 6/30, acc_iter=8758, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:30, time_cost(all): 2:25:07/8:32:31, loss=0.534417195765814, d_time=0.00(0.00), f_time=1.04(1.01), b_time=1.22(1.03), norm=3.5923602635541614, lr=0.000845989441962855
2023-11-02 16:38:02   INFO  epoch: 6/30, acc_iter=8808, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:14, time_cost(all): 2:25:57/8:30:05, loss=0.533994517213132, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.02(1.03), norm=3.202421370564236, lr=0.000844386501100686
2023-11-02 16:38:52   INFO  epoch: 6/30, acc_iter=8858, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:00, time_cost(all): 2:26:47/8:33:40, loss=0.533571838660449, d_time=0.00(0.00), f_time=1.14(1.01), b_time=0.84(1.03), norm=1.2040447328863584, lr=0.000842783560238518
2023-11-02 16:39:43   INFO  epoch: 6/30, acc_iter=8908, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:11, time_cost(all): 2:27:38/8:38:59, loss=0.533149160107767, d_time=0.00(0.00), f_time=0.95(1.01), b_time=0.99(1.03), norm=3.3592608351206725, lr=0.000841180619376349
2023-11-02 16:40:33   INFO  epoch: 6/30, acc_iter=8958, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:21, time_cost(all): 2:28:28/8:41:35, loss=0.532726481555085, d_time=0.00(0.00), f_time=1.07(1.01), b_time=0.92(1.03), norm=2.1599255541305817, lr=0.000839577678514181
2023-11-02 16:41:23   INFO  epoch: 6/30, acc_iter=9008, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:40, time_cost(all): 2:29:18/8:45:18, loss=0.532303803002402, d_time=0.00(0.00), f_time=1.19(1.01), b_time=0.91(1.03), norm=3.2749658711736127, lr=0.000837974737652012
2023-11-02 16:42:14   INFO  epoch: 6/30, acc_iter=9058, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:57, time_cost(all): 2:30:09/8:43:39, loss=0.53188112444972, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.01(1.03), norm=2.581484277589663, lr=0.000836371796789844
2023-11-02 16:43:04   INFO  epoch: 6/30, acc_iter=9108, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:57, time_cost(all): 2:30:59/8:23:50, loss=0.531458445897038, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.08(1.03), norm=0.8249329173769174, lr=0.000834768855927675
2023-11-02 16:43:54   INFO  epoch: 6/30, acc_iter=9158, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:09, time_cost(all): 2:31:49/8:17:22, loss=0.531035767344356, d_time=0.00(0.00), f_time=0.94(1.01), b_time=0.93(1.03), norm=3.2654702933954702, lr=0.000833165915065507
2023-11-02 16:44:45   INFO  epoch: 6/30, acc_iter=9208, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:17, time_cost(all): 2:32:40/8:27:52, loss=0.530613088791673, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.1(1.03), norm=1.8800284146427142, lr=0.000831562974203338
2023-11-02 16:45:35   INFO  epoch: 7/30, acc_iter=9276, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:21:31, time_cost(all): 2:33:30/8:45:32, loss=0.530038245960025, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.1(1.03), norm=4.826057924588035, lr=0.000829382974630789
2023-11-02 16:46:25   INFO  epoch: 7/30, acc_iter=9326, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:20:43, time_cost(all): 2:34:20/8:28:16, loss=0.529615567407343, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.2(1.03), norm=1.0354516751252707, lr=0.000827780033768621
2023-11-02 16:47:16   INFO  epoch: 7/30, acc_iter=9376, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:19:57, time_cost(all): 2:35:11/8:49:37, loss=0.529192888854661, d_time=0.00(0.00), f_time=1.0(1.01), b_time=1.18(1.03), norm=4.960955550912888, lr=0.000826177092906452
2023-11-02 16:48:06   INFO  epoch: 7/30, acc_iter=9426, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:18:44, time_cost(all): 2:36:01/8:12:15, loss=0.528770210301978, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.09(1.03), norm=3.2305082761351587, lr=0.000824574152044284
2023-11-02 16:48:56   INFO  epoch: 7/30, acc_iter=9476, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:18:07, time_cost(all): 2:36:51/8:18:04, loss=0.528347531749296, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.12(1.03), norm=1.7296267385449584, lr=0.000822971211182115
2023-11-02 16:49:47   INFO  epoch: 7/30, acc_iter=9526, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:17:37, time_cost(all): 2:37:42/8:18:23, loss=0.527924853196614, d_time=0.00(0.00), f_time=0.97(1.01), b_time=0.84(1.03), norm=2.76642198136225, lr=0.000821368270319947
2023-11-02 16:50:37   INFO  epoch: 7/30, acc_iter=9576, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:09, time_cost(all): 2:38:32/8:44:25, loss=0.527502174643931, d_time=0.00(0.00), f_time=0.92(1.01), b_time=0.88(1.03), norm=3.3792179850627226, lr=0.000819765329457779
2023-11-02 16:51:27   INFO  epoch: 7/30, acc_iter=9626, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:48, time_cost(all): 2:39:22/8:38:39, loss=0.527079496091249, d_time=0.00(0.00), f_time=1.11(1.01), b_time=0.93(1.03), norm=0.7126100952874415, lr=0.00081816238859561
2023-11-02 16:52:18   INFO  epoch: 7/30, acc_iter=9676, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:04, time_cost(all): 2:40:13/8:41:54, loss=0.526656817538567, d_time=0.00(0.00), f_time=1.01(1.01), b_time=0.97(1.03), norm=1.046943179067772, lr=0.000816559447733442
2023-11-02 16:53:08   INFO  epoch: 7/30, acc_iter=9726, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:43, time_cost(all): 2:41:03/8:42:24, loss=0.526234138985885, d_time=0.00(0.00), f_time=1.12(1.01), b_time=1.21(1.03), norm=4.3228921409405885, lr=0.000814956506871273
2023-11-02 16:53:58   INFO  epoch: 7/30, acc_iter=9776, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:13:27, time_cost(all): 2:41:53/8:31:32, loss=0.525811460433202, d_time=0.00(0.00), f_time=0.96(1.01), b_time=0.92(1.03), norm=3.2752226406438263, lr=0.000813353566009105
2023-11-02 16:54:49   INFO  epoch: 7/30, acc_iter=9826, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:37, time_cost(all): 2:42:44/8:39:31, loss=0.52538878188052, d_time=0.00(0.00), f_time=0.96(1.01), b_time=1.05(1.03), norm=0.636807296577712, lr=0.000811750625146936
2023-11-02 16:55:39   INFO  epoch: 7/30, acc_iter=9876, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:10:40, time_cost(all): 2:43:34/8:39:18, loss=0.524966103327838, d_time=0.00(0.00), f_time=1.0(1.01), b_time=1.1(1.03), norm=0.9451651592134781, lr=0.000810147684284768
2023-11-02 16:56:29   INFO  epoch: 7/30, acc_iter=9926, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:33, time_cost(all): 2:44:24/8:17:17, loss=0.524543424775155, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.12(1.03), norm=3.1978895232997173, lr=0.000808544743422599
2023-11-02 16:57:20   INFO  epoch: 7/30, acc_iter=9976, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:54, time_cost(all): 2:45:15/8:23:02, loss=0.524120746222473, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.04(1.03), norm=4.636643314358102, lr=0.000806941802560431
2023-11-02 16:58:10   INFO  epoch: 7/30, acc_iter=10026, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:44, time_cost(all): 2:46:05/8:25:23, loss=0.523698067669791, d_time=0.00(0.00), f_time=1.21(1.01), b_time=0.86(1.03), norm=2.914456186187838, lr=0.000805338861698263
2023-11-02 16:59:00   INFO  epoch: 7/30, acc_iter=10076, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:47, time_cost(all): 2:46:55/8:16:48, loss=0.523275389117108, d_time=0.00(0.00), f_time=1.1(1.01), b_time=0.85(1.03), norm=1.0858506959848608, lr=0.000803735920836094
2023-11-02 16:59:51   INFO  epoch: 7/30, acc_iter=10126, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:02, time_cost(all): 2:47:46/8:20:14, loss=0.522852710564426, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.05(1.03), norm=1.640226699876515, lr=0.000802132979973925
2023-11-02 17:00:41   INFO  epoch: 7/30, acc_iter=10176, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:02, time_cost(all): 2:48:36/7:50:30, loss=0.522430032011744, d_time=0.00(0.00), f_time=1.2(1.01), b_time=1.16(1.03), norm=0.8620157925916818, lr=0.000800530039111757
2023-11-02 17:01:31   INFO  epoch: 7/30, acc_iter=10226, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:18, time_cost(all): 2:49:26/8:04:13, loss=0.522007353459061, d_time=0.00(0.00), f_time=0.98(1.01), b_time=1.02(1.03), norm=1.28397303592688, lr=0.000798927098249589
2023-11-02 17:02:22   INFO  epoch: 7/30, acc_iter=10276, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:30, time_cost(all): 2:50:17/8:30:03, loss=0.521584674906379, d_time=0.00(0.00), f_time=1.07(1.01), b_time=0.93(1.03), norm=0.5528667631142867, lr=0.00079732415738742
2023-11-02 17:03:12   INFO  epoch: 7/30, acc_iter=10326, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:44, time_cost(all): 2:51:07/7:48:45, loss=0.521161996353697, d_time=0.00(0.00), f_time=1.09(1.01), b_time=1.09(1.03), norm=2.764804423163058, lr=0.000795721216525252
2023-11-02 17:04:02   INFO  epoch: 7/30, acc_iter=10376, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:43, time_cost(all): 2:51:57/8:18:51, loss=0.520739317801015, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.15(1.03), norm=2.817508418015591, lr=0.000794118275663083
2023-11-02 17:04:53   INFO  epoch: 7/30, acc_iter=10426, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:02:02, time_cost(all): 2:52:48/8:23:42, loss=0.520316639248332, d_time=0.00(0.00), f_time=0.92(1.01), b_time=1.15(1.03), norm=4.984096438674875, lr=0.000792515334800915
2023-11-02 17:05:43   INFO  epoch: 7/30, acc_iter=10476, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:10, time_cost(all): 2:53:38/8:07:13, loss=0.51989396069565, d_time=0.00(0.00), f_time=1.03(1.01), b_time=1.09(1.03), norm=3.161740118406233, lr=0.000790912393938746
2023-11-02 17:06:33   INFO  epoch: 7/30, acc_iter=10526, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:18, time_cost(all): 2:54:28/8:21:27, loss=0.519471282142968, d_time=0.00(0.00), f_time=1.0(1.01), b_time=1.22(1.03), norm=1.002479200963479, lr=0.000789309453076578
2023-11-02 17:07:24   INFO  epoch: 8/30, acc_iter=10594, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:22:05, time_cost(all): 2:55:19/8:15:22, loss=0.51889643931132, d_time=0.00(0.00), f_time=1.03(1.01), b_time=1.02(1.03), norm=2.6849806608665543, lr=0.000787129453504029
2023-11-02 17:08:14   INFO  epoch: 8/30, acc_iter=10644, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:19:49, time_cost(all): 2:56:09/7:47:11, loss=0.518473760758637, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.22(1.03), norm=2.1237896336920863, lr=0.00078552651264186
2023-11-02 17:09:04   INFO  epoch: 8/30, acc_iter=10694, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:19:36, time_cost(all): 2:56:59/7:55:14, loss=0.518051082205955, d_time=0.00(0.00), f_time=1.03(1.01), b_time=1.23(1.03), norm=0.6668253467024455, lr=0.000783923571779692
2023-11-02 17:09:55   INFO  epoch: 8/30, acc_iter=10744, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:18:14, time_cost(all): 2:57:50/8:09:18, loss=0.517628403653273, d_time=0.00(0.00), f_time=1.1(1.01), b_time=0.85(1.03), norm=0.7815376365008819, lr=0.000782320630917523
2023-11-02 17:10:45   INFO  epoch: 8/30, acc_iter=10794, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:18:02, time_cost(all): 2:58:40/7:50:02, loss=0.517205725100591, d_time=0.00(0.00), f_time=1.11(1.01), b_time=1.0(1.03), norm=4.703976160796758, lr=0.000780717690055355
2023-11-02 17:11:35   INFO  epoch: 8/30, acc_iter=10844, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:16:32, time_cost(all): 2:59:30/7:51:35, loss=0.516783046547908, d_time=0.00(0.00), f_time=1.04(1.01), b_time=1.11(1.03), norm=4.060863559913421, lr=0.000779114749193186
2023-11-02 17:12:26   INFO  epoch: 8/30, acc_iter=10894, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:47, time_cost(all): 3:00:21/7:59:12, loss=0.516360367995226, d_time=0.00(0.00), f_time=1.2(1.01), b_time=0.99(1.03), norm=1.1612290229808768, lr=0.000777511808331018
2023-11-02 17:13:16   INFO  epoch: 8/30, acc_iter=10944, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:14:46, time_cost(all): 3:01:11/8:00:16, loss=0.515937689442544, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.12(1.03), norm=3.236343247734644, lr=0.00077590886746885
2023-11-02 17:14:06   INFO  epoch: 8/30, acc_iter=10994, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:19, time_cost(all): 3:02:01/7:52:02, loss=0.515515010889861, d_time=0.00(0.00), f_time=1.11(1.01), b_time=0.93(1.03), norm=1.3215515230622747, lr=0.000774305926606681
2023-11-02 17:14:57   INFO  epoch: 8/30, acc_iter=11044, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:38, time_cost(all): 3:02:52/8:03:41, loss=0.515092332337179, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.22(1.03), norm=4.308376957919727, lr=0.000772702985744513
2023-11-02 17:15:47   INFO  epoch: 8/30, acc_iter=11094, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:13:28, time_cost(all): 3:03:42/8:04:35, loss=0.514669653784497, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.18(1.03), norm=4.567686799374472, lr=0.000771100044882344
2023-11-02 17:16:37   INFO  epoch: 8/30, acc_iter=11144, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:11:54, time_cost(all): 3:04:32/8:06:20, loss=0.514246975231814, d_time=0.00(0.00), f_time=1.14(1.01), b_time=0.95(1.03), norm=4.034887888004107, lr=0.000769497104020176
2023-11-02 17:17:28   INFO  epoch: 8/30, acc_iter=11194, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:21, time_cost(all): 3:05:23/7:36:50, loss=0.513824296679132, d_time=0.00(0.00), f_time=0.99(1.01), b_time=0.86(1.03), norm=2.6191304871574728, lr=0.000767894163158007
2023-11-02 17:18:18   INFO  epoch: 8/30, acc_iter=11244, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:09:57, time_cost(all): 3:06:13/7:40:46, loss=0.51340161812645, d_time=0.00(0.00), f_time=1.15(1.01), b_time=1.22(1.03), norm=2.1807198121434763, lr=0.000766291222295839
2023-11-02 17:19:08   INFO  epoch: 8/30, acc_iter=11294, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:25, time_cost(all): 3:07:03/8:12:47, loss=0.512978939573768, d_time=0.00(0.00), f_time=0.98(1.01), b_time=1.01(1.03), norm=2.7742497722704664, lr=0.00076468828143367
2023-11-02 17:19:59   INFO  epoch: 8/30, acc_iter=11344, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:35, time_cost(all): 3:07:54/8:07:33, loss=0.512556261021085, d_time=0.00(0.00), f_time=0.93(1.01), b_time=0.91(1.03), norm=0.7190975266460184, lr=0.000763085340571502
2023-11-02 17:20:49   INFO  epoch: 8/30, acc_iter=11394, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:32, time_cost(all): 3:08:44/8:01:04, loss=0.512133582468403, d_time=0.00(0.00), f_time=0.98(1.01), b_time=0.88(1.03), norm=3.564511243441418, lr=0.000761482399709333
2023-11-02 17:21:39   INFO  epoch: 8/30, acc_iter=11444, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:14, time_cost(all): 3:09:34/7:38:40, loss=0.511710903915721, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.0(1.03), norm=0.8035867566499135, lr=0.000759879458847165
2023-11-02 17:22:30   INFO  epoch: 8/30, acc_iter=11494, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:24, time_cost(all): 3:10:25/7:44:49, loss=0.511288225363038, d_time=0.00(0.00), f_time=1.08(1.01), b_time=0.88(1.03), norm=3.259702458987504, lr=0.000758276517984996
2023-11-02 17:23:20   INFO  epoch: 8/30, acc_iter=11544, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:18, time_cost(all): 3:11:15/7:30:21, loss=0.510865546810356, d_time=0.00(0.00), f_time=1.15(1.01), b_time=1.17(1.03), norm=0.6461619425090164, lr=0.000756673577122828
2023-11-02 17:24:10   INFO  epoch: 8/30, acc_iter=11594, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:40, time_cost(all): 3:12:05/7:51:05, loss=0.510442868257674, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.06(1.03), norm=1.2698161964347934, lr=0.00075507063626066
2023-11-02 17:25:01   INFO  epoch: 8/30, acc_iter=11644, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:50, time_cost(all): 3:12:56/7:30:19, loss=0.510020189704991, d_time=0.00(0.00), f_time=1.1(1.01), b_time=0.88(1.03), norm=4.355751140055467, lr=0.000753467695398491
2023-11-02 17:25:51   INFO  epoch: 8/30, acc_iter=11694, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:45, time_cost(all): 3:13:46/7:31:59, loss=0.509597511152309, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.92(1.03), norm=4.891948984396211, lr=0.000751864754536323
2023-11-02 17:26:41   INFO  epoch: 8/30, acc_iter=11744, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:59, time_cost(all): 3:14:36/7:29:37, loss=0.509174832599627, d_time=0.00(0.00), f_time=1.1(1.01), b_time=1.08(1.03), norm=1.2495954374962575, lr=0.000750261813674154
2023-11-02 17:27:32   INFO  epoch: 8/30, acc_iter=11794, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:06, time_cost(all): 3:15:27/7:38:41, loss=0.508752154046945, d_time=0.00(0.00), f_time=1.07(1.01), b_time=1.12(1.03), norm=4.3397741551983575, lr=0.000748658872811986
2023-11-02 17:28:22   INFO  epoch: 8/30, acc_iter=11844, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:19, time_cost(all): 3:16:17/8:04:34, loss=0.508329475494262, d_time=0.00(0.00), f_time=1.13(1.01), b_time=0.85(1.03), norm=4.959108895235692, lr=0.000747055931949817
2023-11-02 17:29:12   INFO  epoch: 9/30, acc_iter=11912, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:21:39, time_cost(all): 3:17:07/7:28:40, loss=0.507754632662614, d_time=0.00(0.00), f_time=1.18(1.01), b_time=0.92(1.03), norm=4.620576191142311, lr=0.000744875932377268
2023-11-02 17:30:03   INFO  epoch: 9/30, acc_iter=11962, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:19:44, time_cost(all): 3:17:58/8:05:38, loss=0.507331954109932, d_time=0.00(0.00), f_time=1.07(1.01), b_time=1.15(1.03), norm=2.5694908892363535, lr=0.0007432729915151
2023-11-02 17:30:53   INFO  epoch: 9/30, acc_iter=12012, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:19:53, time_cost(all): 3:18:48/7:21:58, loss=0.50690927555725, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.21(1.03), norm=2.4749580014583055, lr=0.000741670050652931
2023-11-02 17:31:43   INFO  epoch: 9/30, acc_iter=12062, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:18:20, time_cost(all): 3:19:38/7:22:42, loss=0.506486597004567, d_time=0.00(0.00), f_time=1.02(1.01), b_time=0.9(1.03), norm=4.846724534484305, lr=0.000740067109790763
2023-11-02 17:32:34   INFO  epoch: 9/30, acc_iter=12112, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:05, time_cost(all): 3:20:29/8:01:20, loss=0.506063918451885, d_time=0.00(0.00), f_time=1.1(1.01), b_time=1.16(1.03), norm=0.9236316212317484, lr=0.000738464168928594
2023-11-02 17:33:24   INFO  epoch: 9/30, acc_iter=12162, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:16:54, time_cost(all): 3:21:19/8:02:58, loss=0.505641239899203, d_time=0.00(0.00), f_time=1.21(1.01), b_time=0.93(1.03), norm=1.431533445267773, lr=0.000736861228066426
2023-11-02 17:34:14   INFO  epoch: 9/30, acc_iter=12212, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:25, time_cost(all): 3:22:09/7:56:42, loss=0.50521856134652, d_time=0.00(0.00), f_time=1.0(1.01), b_time=0.85(1.03), norm=1.1452000544354763, lr=0.000735258287204257
2023-11-02 17:35:05   INFO  epoch: 9/30, acc_iter=12262, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:38, time_cost(all): 3:23:00/7:47:10, loss=0.504795882793838, d_time=0.00(0.00), f_time=1.0(1.01), b_time=1.12(1.03), norm=2.400915795727898, lr=0.000733655346342089
2023-11-02 17:35:55   INFO  epoch: 9/30, acc_iter=12312, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:46, time_cost(all): 3:23:50/7:46:56, loss=0.504373204241156, d_time=0.00(0.00), f_time=1.07(1.01), b_time=0.86(1.03), norm=4.852660365260351, lr=0.000732052405479921
2023-11-02 17:36:45   INFO  epoch: 9/30, acc_iter=12362, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:04, time_cost(all): 3:24:40/7:42:55, loss=0.503950525688474, d_time=0.00(0.00), f_time=1.2(1.01), b_time=0.96(1.03), norm=1.6931264975105642, lr=0.000730449464617752
2023-11-02 17:37:36   INFO  epoch: 9/30, acc_iter=12412, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:13:06, time_cost(all): 3:25:31/7:35:44, loss=0.503527847135791, d_time=0.00(0.00), f_time=1.2(1.01), b_time=0.96(1.03), norm=4.69233948500274, lr=0.000728846523755584
2023-11-02 17:38:26   INFO  epoch: 9/30, acc_iter=12462, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:11:43, time_cost(all): 3:26:21/7:15:43, loss=0.503105168583109, d_time=0.00(0.00), f_time=0.95(1.01), b_time=0.91(1.03), norm=0.8384241474138702, lr=0.000727243582893415
2023-11-02 17:39:16   INFO  epoch: 9/30, acc_iter=12512, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:10:38, time_cost(all): 3:27:11/7:31:11, loss=0.502682490030427, d_time=0.00(0.00), f_time=0.98(1.01), b_time=1.18(1.03), norm=4.665435018426703, lr=0.000725640642031247
2023-11-02 17:40:07   INFO  epoch: 9/30, acc_iter=12562, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:20, time_cost(all): 3:28:02/7:14:43, loss=0.502259811477744, d_time=0.00(0.00), f_time=1.15(1.01), b_time=1.06(1.03), norm=1.3111451004528398, lr=0.000724037701169078
2023-11-02 17:40:57   INFO  epoch: 9/30, acc_iter=12612, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:51, time_cost(all): 3:28:52/7:32:58, loss=0.501837132925062, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.04(1.03), norm=2.74794972923399, lr=0.00072243476030691
2023-11-02 17:41:47   INFO  epoch: 9/30, acc_iter=12662, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:45, time_cost(all): 3:29:42/7:51:05, loss=0.50141445437238, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.93(1.03), norm=3.754288529978255, lr=0.000720831819444741
2023-11-02 17:42:38   INFO  epoch: 9/30, acc_iter=12712, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:59, time_cost(all): 3:30:33/7:27:28, loss=0.500991775819697, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.86(1.03), norm=1.7194131924731688, lr=0.000719228878582573
2023-11-02 17:43:28   INFO  epoch: 9/30, acc_iter=12762, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:03, time_cost(all): 3:31:23/7:17:04, loss=0.500569097267015, d_time=0.00(0.00), f_time=1.06(1.01), b_time=0.92(1.03), norm=2.1589512388850896, lr=0.000717625937720404
2023-11-02 17:44:18   INFO  epoch: 9/30, acc_iter=12812, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:05:52, time_cost(all): 3:32:13/7:49:58, loss=0.500146418714333, d_time=0.00(0.00), f_time=1.16(1.01), b_time=1.19(1.03), norm=1.1521131150173771, lr=0.000716022996858236
2023-11-02 17:45:09   INFO  epoch: 9/30, acc_iter=12862, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:05, time_cost(all): 3:33:04/7:10:37, loss=0.49972374016165, d_time=0.00(0.00), f_time=1.11(1.01), b_time=0.84(1.03), norm=1.673626296314519, lr=0.000714420055996067
2023-11-02 17:45:59   INFO  epoch: 9/30, acc_iter=12912, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:17, time_cost(all): 3:33:54/7:19:46, loss=0.499301061608968, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.06(1.03), norm=0.709889365722757, lr=0.000712817115133899
2023-11-02 17:46:49   INFO  epoch: 9/30, acc_iter=12962, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:35, time_cost(all): 3:34:44/7:30:27, loss=0.498878383056286, d_time=0.00(0.00), f_time=1.0(1.01), b_time=0.86(1.03), norm=0.5974271835822368, lr=0.000711214174271731
2023-11-02 17:47:40   INFO  epoch: 9/30, acc_iter=13012, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:45, time_cost(all): 3:35:35/7:23:40, loss=0.498455704503604, d_time=0.00(0.00), f_time=1.21(1.01), b_time=1.04(1.03), norm=3.5758470311943684, lr=0.000709611233409562
2023-11-02 17:48:30   INFO  epoch: 9/30, acc_iter=13062, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:53, time_cost(all): 3:36:25/7:36:01, loss=0.498033025950921, d_time=0.00(0.00), f_time=1.11(1.01), b_time=0.85(1.03), norm=1.8232488864093896, lr=0.000708008292547394
2023-11-02 17:49:20   INFO  epoch: 9/30, acc_iter=13112, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:09, time_cost(all): 3:37:15/7:40:56, loss=0.497610347398239, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.07(1.03), norm=3.8564242788854335, lr=0.000706405351685225
2023-11-02 17:50:11   INFO  epoch: 9/30, acc_iter=13162, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:18, time_cost(all): 3:38:06/7:38:00, loss=0.497187668845557, d_time=0.00(0.00), f_time=1.01(1.01), b_time=1.08(1.03), norm=3.974407321485968, lr=0.000704802410823057
2023-11-02 17:51:01   INFO  epoch: 10/30, acc_iter=13230, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:21:18, time_cost(all): 3:38:56/7:17:49, loss=0.496612826013909, d_time=0.00(0.00), f_time=0.91(1.01), b_time=0.83(1.03), norm=2.2466158825464904, lr=0.000702622411250508
2023-11-02 17:51:51   INFO  epoch: 10/30, acc_iter=13280, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:20:30, time_cost(all): 3:39:46/7:16:40, loss=0.496190147461226, d_time=0.00(0.00), f_time=1.12(1.01), b_time=1.2(1.03), norm=0.9804471082398367, lr=0.000701019470388339
2023-11-02 17:52:42   INFO  epoch: 10/30, acc_iter=13330, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:19:09, time_cost(all): 3:40:37/7:37:02, loss=0.495767468908544, d_time=0.00(0.00), f_time=0.94(1.01), b_time=1.18(1.03), norm=3.1202017495955436, lr=0.000699416529526171
2023-11-02 17:53:32   INFO  epoch: 10/30, acc_iter=13380, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:18:44, time_cost(all): 3:41:27/7:15:04, loss=0.495344790355862, d_time=0.00(0.00), f_time=1.05(1.01), b_time=0.92(1.03), norm=3.6900849174199073, lr=0.000697813588664002
2023-11-02 17:54:22   INFO  epoch: 10/30, acc_iter=13430, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:18:09, time_cost(all): 3:42:17/7:26:56, loss=0.49492211180318, d_time=0.00(0.00), f_time=1.05(1.01), b_time=0.92(1.03), norm=2.8741227133785, lr=0.000696210647801834
2023-11-02 17:55:13   INFO  epoch: 10/30, acc_iter=13480, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:17:08, time_cost(all): 3:43:08/7:21:52, loss=0.494499433250497, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.2(1.03), norm=4.27254690825669, lr=0.000694607706939665
2023-11-02 17:56:03   INFO  epoch: 10/30, acc_iter=13530, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:40, time_cost(all): 3:43:58/7:17:57, loss=0.494076754697815, d_time=0.00(0.00), f_time=0.96(1.01), b_time=0.98(1.03), norm=3.9013241548573516, lr=0.000693004766077497
2023-11-02 17:56:53   INFO  epoch: 10/30, acc_iter=13580, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:57, time_cost(all): 3:44:48/7:16:17, loss=0.493654076145133, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.15(1.03), norm=0.6209432992098872, lr=0.000691401825215328
2023-11-02 17:57:44   INFO  epoch: 10/30, acc_iter=13630, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:13:56, time_cost(all): 3:45:39/6:57:39, loss=0.49323139759245, d_time=0.00(0.00), f_time=0.91(1.01), b_time=0.92(1.03), norm=3.6410999951859986, lr=0.00068979888435316
2023-11-02 17:58:34   INFO  epoch: 10/30, acc_iter=13680, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:26, time_cost(all): 3:46:29/7:13:33, loss=0.492808719039768, d_time=0.00(0.00), f_time=1.03(1.01), b_time=1.04(1.03), norm=3.772972929491563, lr=0.000688195943490992
2023-11-02 17:59:24   INFO  epoch: 10/30, acc_iter=13730, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:48, time_cost(all): 3:47:19/7:28:38, loss=0.492386040487086, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.83(1.03), norm=2.9362246473805422, lr=0.000686593002628823
2023-11-02 18:00:15   INFO  epoch: 10/30, acc_iter=13780, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:18, time_cost(all): 3:48:10/7:22:17, loss=0.491963361934403, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.18(1.03), norm=3.279531389130865, lr=0.000684990061766655
2023-11-02 18:01:05   INFO  epoch: 10/30, acc_iter=13830, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:04, time_cost(all): 3:49:00/6:57:01, loss=0.491540683381721, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.15(1.03), norm=2.9705716372938107, lr=0.000683387120904486
2023-11-02 18:01:55   INFO  epoch: 10/30, acc_iter=13880, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:24, time_cost(all): 3:49:50/6:55:15, loss=0.491118004829039, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.12(1.03), norm=4.743983228701674, lr=0.000681784180042318
2023-11-02 18:02:46   INFO  epoch: 10/30, acc_iter=13930, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:20, time_cost(all): 3:50:41/6:54:44, loss=0.490695326276357, d_time=0.00(0.00), f_time=1.11(1.01), b_time=0.87(1.03), norm=0.5785401488234589, lr=0.000680181239180149
2023-11-02 18:03:36   INFO  epoch: 10/30, acc_iter=13980, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:09:03, time_cost(all): 3:51:31/7:08:54, loss=0.490272647723674, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.11(1.03), norm=2.092008818513541, lr=0.000678578298317981
2023-11-02 18:04:26   INFO  epoch: 10/30, acc_iter=14030, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:34, time_cost(all): 3:52:21/7:32:10, loss=0.489849969170992, d_time=0.00(0.00), f_time=1.04(1.01), b_time=1.21(1.03), norm=0.7952282465868685, lr=0.000676975357455812
2023-11-02 18:05:17   INFO  epoch: 10/30, acc_iter=14080, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:02, time_cost(all): 3:53:12/7:10:41, loss=0.48942729061831, d_time=0.00(0.00), f_time=1.04(1.01), b_time=1.06(1.03), norm=2.5347570238792043, lr=0.000675372416593644
2023-11-02 18:06:07   INFO  epoch: 10/30, acc_iter=14130, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:19, time_cost(all): 3:54:02/6:49:28, loss=0.489004612065627, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.0(1.03), norm=1.4823053546398963, lr=0.000673769475731475
2023-11-02 18:06:57   INFO  epoch: 10/30, acc_iter=14180, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:16, time_cost(all): 3:54:52/7:01:06, loss=0.488581933512945, d_time=0.00(0.00), f_time=1.11(1.01), b_time=1.11(1.03), norm=3.244105367701119, lr=0.000672166534869307
2023-11-02 18:07:48   INFO  epoch: 10/30, acc_iter=14230, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:39, time_cost(all): 3:55:43/7:23:44, loss=0.488159254960263, d_time=0.00(0.00), f_time=0.92(1.01), b_time=1.01(1.03), norm=1.5946851848685681, lr=0.000670563594007139
2023-11-02 18:08:38   INFO  epoch: 10/30, acc_iter=14280, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:38, time_cost(all): 3:56:33/7:00:45, loss=0.48773657640758, d_time=0.00(0.00), f_time=1.2(1.01), b_time=1.07(1.03), norm=2.493865188537871, lr=0.00066896065314497
2023-11-02 18:09:28   INFO  epoch: 10/30, acc_iter=14330, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:57, time_cost(all): 3:57:23/7:05:29, loss=0.487313897854898, d_time=0.00(0.00), f_time=1.11(1.01), b_time=1.23(1.03), norm=2.8692390996360118, lr=0.000667357712282802
2023-11-02 18:10:19   INFO  epoch: 10/30, acc_iter=14380, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:02:00, time_cost(all): 3:58:14/7:08:34, loss=0.486891219302216, d_time=0.00(0.00), f_time=1.04(1.01), b_time=0.94(1.03), norm=4.519429713511831, lr=0.000665754771420633
2023-11-02 18:11:09   INFO  epoch: 10/30, acc_iter=14430, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:10, time_cost(all): 3:59:04/6:59:42, loss=0.486468540749533, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.13(1.03), norm=3.6900472873222308, lr=0.000664151830558465
2023-11-02 18:11:59   INFO  epoch: 10/30, acc_iter=14480, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:17, time_cost(all): 3:59:54/7:07:43, loss=0.486045862196851, d_time=0.00(0.00), f_time=1.16(1.01), b_time=1.2(1.03), norm=1.281734484213502, lr=0.000662548889696296
2023-11-02 18:12:50   INFO  epoch: 11/30, acc_iter=14548, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:20:12, time_cost(all): 4:00:45/6:41:31, loss=0.485471019365203, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.17(1.03), norm=1.1202120666268536, lr=0.000660368890123747
2023-11-02 18:13:40   INFO  epoch: 11/30, acc_iter=14598, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:21:01, time_cost(all): 4:01:35/6:59:08, loss=0.485048340812521, d_time=0.00(0.00), f_time=1.05(1.01), b_time=0.85(1.03), norm=2.291795123096663, lr=0.000658765949261579
2023-11-02 18:14:30   INFO  epoch: 11/30, acc_iter=14648, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:20:18, time_cost(all): 4:02:25/7:05:15, loss=0.484625662259839, d_time=0.00(0.00), f_time=0.95(1.01), b_time=1.04(1.03), norm=3.0214125693405904, lr=0.00065716300839941
2023-11-02 18:15:21   INFO  epoch: 11/30, acc_iter=14698, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:18:30, time_cost(all): 4:03:16/7:04:10, loss=0.484202983707156, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.88(1.03), norm=2.9647710936259077, lr=0.000655560067537242
2023-11-02 18:16:11   INFO  epoch: 11/30, acc_iter=14748, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:08, time_cost(all): 4:04:06/7:19:23, loss=0.483780305154474, d_time=0.00(0.00), f_time=1.12(1.01), b_time=0.86(1.03), norm=1.0115669855325644, lr=0.000653957126675073
2023-11-02 18:17:01   INFO  epoch: 11/30, acc_iter=14798, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:16:26, time_cost(all): 4:04:56/6:53:36, loss=0.483357626601792, d_time=0.00(0.00), f_time=0.96(1.01), b_time=0.98(1.03), norm=4.276092366176465, lr=0.000652354185812905
2023-11-02 18:17:52   INFO  epoch: 11/30, acc_iter=14848, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:15, time_cost(all): 4:05:47/7:10:07, loss=0.482934948049109, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.2(1.03), norm=2.6387500022690946, lr=0.000650751244950736
2023-11-02 18:18:42   INFO  epoch: 11/30, acc_iter=14898, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:18, time_cost(all): 4:06:37/6:38:40, loss=0.482512269496427, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.01(1.03), norm=0.5141486499653243, lr=0.000649148304088568
2023-11-02 18:19:32   INFO  epoch: 11/30, acc_iter=14948, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:15:14, time_cost(all): 4:07:27/7:03:16, loss=0.482089590943745, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.03(1.03), norm=2.9088131322062787, lr=0.0006475453632264
2023-11-02 18:20:23   INFO  epoch: 11/30, acc_iter=14998, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:57, time_cost(all): 4:08:18/7:01:35, loss=0.481666912391063, d_time=0.00(0.00), f_time=1.2(1.01), b_time=1.17(1.03), norm=2.1946845326788114, lr=0.000645942422364231
2023-11-02 18:21:13   INFO  epoch: 11/30, acc_iter=15048, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:40, time_cost(all): 4:09:08/6:56:58, loss=0.48124423383838, d_time=0.00(0.00), f_time=1.18(1.01), b_time=1.13(1.03), norm=1.8600429493645692, lr=0.000644339481502062
2023-11-02 18:22:03   INFO  epoch: 11/30, acc_iter=15098, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:09, time_cost(all): 4:09:58/7:02:34, loss=0.480821555285698, d_time=0.00(0.00), f_time=0.94(1.01), b_time=0.93(1.03), norm=1.559769458803237, lr=0.000642736540639894
2023-11-02 18:22:54   INFO  epoch: 11/30, acc_iter=15148, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:12, time_cost(all): 4:10:49/7:06:40, loss=0.480398876733016, d_time=0.00(0.00), f_time=1.08(1.01), b_time=0.84(1.03), norm=3.9636684094773345, lr=0.000641133599777726
2023-11-02 18:23:44   INFO  epoch: 11/30, acc_iter=15198, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:47, time_cost(all): 4:11:39/6:58:50, loss=0.479976198180333, d_time=0.00(0.00), f_time=0.92(1.01), b_time=1.22(1.03), norm=3.710056098375635, lr=0.000639530658915557
2023-11-02 18:24:34   INFO  epoch: 11/30, acc_iter=15248, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:46, time_cost(all): 4:12:29/6:59:04, loss=0.479553519627651, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.09(1.03), norm=3.1056177777220544, lr=0.000637927718053389
2023-11-02 18:25:25   INFO  epoch: 11/30, acc_iter=15298, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:38, time_cost(all): 4:13:20/6:45:14, loss=0.479130841074969, d_time=0.00(0.00), f_time=1.21(1.01), b_time=0.96(1.03), norm=4.035238087854293, lr=0.00063632477719122
2023-11-02 18:26:15   INFO  epoch: 11/30, acc_iter=15348, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:53, time_cost(all): 4:14:10/6:53:21, loss=0.478708162522286, d_time=0.00(0.00), f_time=0.92(1.01), b_time=0.97(1.03), norm=4.780806158754396, lr=0.000634721836329052
2023-11-02 18:27:05   INFO  epoch: 11/30, acc_iter=15398, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:20, time_cost(all): 4:15:00/7:04:14, loss=0.478285483969604, d_time=0.00(0.00), f_time=1.2(1.01), b_time=0.87(1.03), norm=4.873132612100658, lr=0.000633118895466883
2023-11-02 18:27:56   INFO  epoch: 11/30, acc_iter=15448, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:23, time_cost(all): 4:15:51/6:28:51, loss=0.477862805416922, d_time=0.00(0.00), f_time=0.93(1.01), b_time=0.91(1.03), norm=4.3157913674303945, lr=0.000631515954604715
2023-11-02 18:28:46   INFO  epoch: 11/30, acc_iter=15498, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:22, time_cost(all): 4:16:41/6:33:23, loss=0.47744012686424, d_time=0.00(0.00), f_time=1.19(1.01), b_time=0.91(1.03), norm=0.9947963637188524, lr=0.000629913013742546
2023-11-02 18:29:36   INFO  epoch: 11/30, acc_iter=15548, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:41, time_cost(all): 4:17:31/7:04:54, loss=0.477017448311557, d_time=0.00(0.00), f_time=1.01(1.01), b_time=1.07(1.03), norm=0.7018924945026137, lr=0.000628310072880378
2023-11-02 18:30:27   INFO  epoch: 11/30, acc_iter=15598, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:42, time_cost(all): 4:18:22/6:51:08, loss=0.476594769758875, d_time=0.00(0.00), f_time=0.95(1.01), b_time=0.93(1.03), norm=4.884172725917705, lr=0.00062670713201821
2023-11-02 18:31:17   INFO  epoch: 11/30, acc_iter=15648, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:56, time_cost(all): 4:19:12/6:55:08, loss=0.476172091206193, d_time=0.00(0.00), f_time=0.93(1.01), b_time=1.01(1.03), norm=1.0265602846913309, lr=0.000625104191156041
2023-11-02 18:32:07   INFO  epoch: 11/30, acc_iter=15698, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:02:01, time_cost(all): 4:20:02/6:57:39, loss=0.47574941265351, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.16(1.03), norm=4.92603768002415, lr=0.000623501250293873
2023-11-02 18:32:58   INFO  epoch: 11/30, acc_iter=15748, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:09, time_cost(all): 4:20:53/6:49:01, loss=0.475326734100828, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.06(1.03), norm=3.0348679367182303, lr=0.000621898309431704
2023-11-02 18:33:48   INFO  epoch: 11/30, acc_iter=15798, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:18, time_cost(all): 4:21:43/6:28:18, loss=0.474904055548146, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.11(1.03), norm=4.404595320426227, lr=0.000620295368569536
2023-11-02 18:34:38   INFO  epoch: 12/30, acc_iter=15866, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:20:58, time_cost(all): 4:22:33/7:00:01, loss=0.474329212716498, d_time=0.00(0.00), f_time=0.92(1.01), b_time=1.0(1.03), norm=1.7505214555805126, lr=0.000618115368996987
2023-11-02 18:35:29   INFO  epoch: 12/30, acc_iter=15916, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:19:43, time_cost(all): 4:23:24/6:54:56, loss=0.473906534163815, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.11(1.03), norm=2.654485071350952, lr=0.000616512428134818
2023-11-02 18:36:19   INFO  epoch: 12/30, acc_iter=15966, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:18:53, time_cost(all): 4:24:14/6:45:11, loss=0.473483855611133, d_time=0.00(0.00), f_time=1.01(1.01), b_time=1.16(1.03), norm=2.091231498636782, lr=0.00061490948727265
2023-11-02 18:37:09   INFO  epoch: 12/30, acc_iter=16016, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:17:57, time_cost(all): 4:25:04/6:26:35, loss=0.473061177058451, d_time=0.00(0.00), f_time=1.05(1.01), b_time=0.92(1.03), norm=3.462603997444135, lr=0.000613306546410481
2023-11-02 18:38:00   INFO  epoch: 12/30, acc_iter=16066, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:32, time_cost(all): 4:25:55/6:54:06, loss=0.472638498505769, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.93(1.03), norm=4.932861499503903, lr=0.000611703605548313
2023-11-02 18:38:50   INFO  epoch: 12/30, acc_iter=16116, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:16:22, time_cost(all): 4:26:45/6:27:54, loss=0.472215819953086, d_time=0.00(0.00), f_time=1.04(1.01), b_time=1.06(1.03), norm=3.5887451371545604, lr=0.000610100664686144
2023-11-02 18:39:40   INFO  epoch: 12/30, acc_iter=16166, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:17:01, time_cost(all): 4:27:35/6:49:05, loss=0.471793141400404, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.2(1.03), norm=3.4885128161510464, lr=0.000608497723823976
2023-11-02 18:40:31   INFO  epoch: 12/30, acc_iter=16216, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:16:04, time_cost(all): 4:28:26/6:26:57, loss=0.471370462847722, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.21(1.03), norm=2.648613203938227, lr=0.000606894782961807
2023-11-02 18:41:21   INFO  epoch: 12/30, acc_iter=16266, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:15:14, time_cost(all): 4:29:16/6:45:04, loss=0.470947784295039, d_time=0.00(0.00), f_time=1.05(1.01), b_time=0.89(1.03), norm=4.0373237397954, lr=0.000605291842099639
2023-11-02 18:42:11   INFO  epoch: 12/30, acc_iter=16316, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:41, time_cost(all): 4:30:06/6:34:41, loss=0.470525105742357, d_time=0.00(0.00), f_time=0.99(1.01), b_time=0.9(1.03), norm=4.693949922207434, lr=0.00060368890123747
2023-11-02 18:43:02   INFO  epoch: 12/30, acc_iter=16366, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:20, time_cost(all): 4:30:57/6:15:04, loss=0.470102427189675, d_time=0.00(0.00), f_time=1.01(1.01), b_time=1.08(1.03), norm=4.316886988777915, lr=0.000602085960375302
2023-11-02 18:43:52   INFO  epoch: 12/30, acc_iter=16416, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:11:56, time_cost(all): 4:31:47/6:22:17, loss=0.469679748636992, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.1(1.03), norm=3.024263221315109, lr=0.000600483019513133
2023-11-02 18:44:42   INFO  epoch: 12/30, acc_iter=16466, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:44, time_cost(all): 4:32:37/6:23:09, loss=0.46925707008431, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.06(1.03), norm=1.177124142455748, lr=0.000598880078650965
2023-11-02 18:45:33   INFO  epoch: 12/30, acc_iter=16516, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:09:55, time_cost(all): 4:33:28/6:47:54, loss=0.468834391531628, d_time=0.00(0.00), f_time=0.94(1.01), b_time=1.21(1.03), norm=0.5828764304050813, lr=0.000597277137788797
2023-11-02 18:46:23   INFO  epoch: 12/30, acc_iter=16566, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:17, time_cost(all): 4:34:18/6:45:15, loss=0.468411712978946, d_time=0.00(0.00), f_time=1.07(1.01), b_time=0.95(1.03), norm=3.5855918775733944, lr=0.000595674196926628
2023-11-02 18:47:13   INFO  epoch: 12/30, acc_iter=16616, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:59, time_cost(all): 4:35:08/6:19:30, loss=0.467989034426263, d_time=0.00(0.00), f_time=0.92(1.01), b_time=1.14(1.03), norm=4.588337307946666, lr=0.00059407125606446
2023-11-02 18:48:04   INFO  epoch: 12/30, acc_iter=16666, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:08:03, time_cost(all): 4:35:59/6:27:35, loss=0.467566355873581, d_time=0.00(0.00), f_time=1.02(1.01), b_time=0.99(1.03), norm=3.5110343795023464, lr=0.000592468315202291
2023-11-02 18:48:54   INFO  epoch: 12/30, acc_iter=16716, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:06:46, time_cost(all): 4:36:49/6:37:10, loss=0.467143677320899, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.15(1.03), norm=1.760249001842503, lr=0.000590865374340123
2023-11-02 18:49:44   INFO  epoch: 12/30, acc_iter=16766, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:21, time_cost(all): 4:37:39/6:34:40, loss=0.466720998768216, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.16(1.03), norm=3.7480486024210524, lr=0.000589262433477954
2023-11-02 18:50:34   INFO  epoch: 12/30, acc_iter=16816, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:05, time_cost(all): 4:38:29/6:06:18, loss=0.466298320215534, d_time=0.00(0.00), f_time=1.07(1.01), b_time=0.99(1.03), norm=1.2455825065555945, lr=0.000587659492615786
2023-11-02 18:51:25   INFO  epoch: 12/30, acc_iter=16866, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:38, time_cost(all): 4:39:20/6:43:07, loss=0.465875641662852, d_time=0.00(0.00), f_time=1.01(1.01), b_time=1.11(1.03), norm=3.850454011857276, lr=0.000586056551753617
2023-11-02 18:52:15   INFO  epoch: 12/30, acc_iter=16916, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:33, time_cost(all): 4:40:10/6:28:46, loss=0.465452963110169, d_time=0.00(0.00), f_time=0.91(1.01), b_time=0.99(1.03), norm=4.719451401320931, lr=0.000584453610891449
2023-11-02 18:53:05   INFO  epoch: 12/30, acc_iter=16966, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:52, time_cost(all): 4:41:00/6:08:34, loss=0.465030284557487, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.17(1.03), norm=3.7568035251422094, lr=0.00058285067002928
2023-11-02 18:53:56   INFO  epoch: 12/30, acc_iter=17016, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:52, time_cost(all): 4:41:51/6:06:43, loss=0.464607606004805, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.03(1.03), norm=4.502267762804347, lr=0.000581247729167112
2023-11-02 18:54:46   INFO  epoch: 12/30, acc_iter=17066, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:07, time_cost(all): 4:42:41/6:05:34, loss=0.464184927452122, d_time=0.00(0.00), f_time=1.09(1.01), b_time=1.06(1.03), norm=4.407008059281305, lr=0.000579644788304943
2023-11-02 18:55:36   INFO  epoch: 12/30, acc_iter=17116, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:18, time_cost(all): 4:43:31/6:21:49, loss=0.46376224889944, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.23(1.03), norm=1.7603567219400036, lr=0.000578041847442775
2023-11-02 18:56:27   INFO  epoch: 13/30, acc_iter=17184, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:20:52, time_cost(all): 4:44:22/6:30:41, loss=0.463187406067792, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.1(1.03), norm=1.028710923962274, lr=0.000575861847870226
2023-11-02 18:57:17   INFO  epoch: 13/30, acc_iter=17234, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:21:00, time_cost(all): 4:45:12/6:36:16, loss=0.46276472751511, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.12(1.03), norm=2.610208957051687, lr=0.000574258907008057
2023-11-02 18:58:07   INFO  epoch: 13/30, acc_iter=17284, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:18:51, time_cost(all): 4:46:02/5:58:52, loss=0.462342048962428, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.89(1.03), norm=1.0277942237078734, lr=0.000572655966145889
2023-11-02 18:58:58   INFO  epoch: 13/30, acc_iter=17334, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:17:59, time_cost(all): 4:46:53/6:08:08, loss=0.461919370409745, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.21(1.03), norm=2.364468233187834, lr=0.000571053025283721
2023-11-02 18:59:48   INFO  epoch: 13/30, acc_iter=17384, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:18:15, time_cost(all): 4:47:43/6:00:25, loss=0.461496691857063, d_time=0.00(0.00), f_time=1.15(1.01), b_time=0.9(1.03), norm=0.8979168837433142, lr=0.000569450084421552
2023-11-02 19:00:38   INFO  epoch: 13/30, acc_iter=17434, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:17:33, time_cost(all): 4:48:33/6:27:35, loss=0.461074013304381, d_time=0.00(0.00), f_time=0.96(1.01), b_time=1.08(1.03), norm=2.350639850896659, lr=0.000567847143559384
2023-11-02 19:01:29   INFO  epoch: 13/30, acc_iter=17484, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:32, time_cost(all): 4:49:24/6:11:57, loss=0.460651334751698, d_time=0.00(0.00), f_time=0.92(1.01), b_time=1.17(1.03), norm=0.6383012273321097, lr=0.000566244202697215
2023-11-02 19:02:19   INFO  epoch: 13/30, acc_iter=17534, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:17, time_cost(all): 4:50:14/6:27:30, loss=0.460228656199016, d_time=0.00(0.00), f_time=1.1(1.01), b_time=1.06(1.03), norm=3.8070705667501192, lr=0.000564641261835047
2023-11-02 19:03:09   INFO  epoch: 13/30, acc_iter=17584, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:32, time_cost(all): 4:51:04/6:23:52, loss=0.459805977646334, d_time=0.00(0.00), f_time=1.1(1.01), b_time=1.18(1.03), norm=4.347482942157601, lr=0.000563038320972878
2023-11-02 19:04:00   INFO  epoch: 13/30, acc_iter=17634, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:26, time_cost(all): 4:51:55/6:07:22, loss=0.459383299093652, d_time=0.00(0.00), f_time=1.2(1.01), b_time=0.85(1.03), norm=4.979638983993114, lr=0.00056143538011071
2023-11-02 19:04:50   INFO  epoch: 13/30, acc_iter=17684, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:13:23, time_cost(all): 4:52:45/6:22:16, loss=0.458960620540969, d_time=0.00(0.00), f_time=0.94(1.01), b_time=1.19(1.03), norm=3.6366865033695195, lr=0.000559832439248541
2023-11-02 19:05:40   INFO  epoch: 13/30, acc_iter=17734, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:07, time_cost(all): 4:53:35/5:52:41, loss=0.458537941988287, d_time=0.00(0.00), f_time=1.1(1.01), b_time=1.06(1.03), norm=3.6746889044989297, lr=0.000558229498386373
2023-11-02 19:06:31   INFO  epoch: 13/30, acc_iter=17784, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:10:41, time_cost(all): 4:54:26/6:05:55, loss=0.458115263435605, d_time=0.00(0.00), f_time=1.16(1.01), b_time=0.89(1.03), norm=1.3865075081823806, lr=0.000556626557524204
2023-11-02 19:07:21   INFO  epoch: 13/30, acc_iter=17834, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:01, time_cost(all): 4:55:16/6:03:00, loss=0.457692584882922, d_time=0.00(0.00), f_time=1.09(1.01), b_time=1.16(1.03), norm=4.208377206033546, lr=0.000555023616662036
2023-11-02 19:08:11   INFO  epoch: 13/30, acc_iter=17884, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:26, time_cost(all): 4:56:06/6:07:23, loss=0.45726990633024, d_time=0.00(0.00), f_time=1.16(1.01), b_time=0.87(1.03), norm=1.0141457057446617, lr=0.000553420675799867
2023-11-02 19:09:02   INFO  epoch: 13/30, acc_iter=17934, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:27, time_cost(all): 4:56:57/6:11:02, loss=0.456847227777558, d_time=0.00(0.00), f_time=0.94(1.01), b_time=0.95(1.03), norm=3.288218171181184, lr=0.000551817734937699
2023-11-02 19:09:52   INFO  epoch: 13/30, acc_iter=17984, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:39, time_cost(all): 4:57:47/6:20:49, loss=0.456424549224875, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.17(1.03), norm=2.7693051343658652, lr=0.000550214794075531
2023-11-02 19:10:42   INFO  epoch: 13/30, acc_iter=18034, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:17, time_cost(all): 4:58:37/5:54:56, loss=0.456001870672193, d_time=0.00(0.00), f_time=1.03(1.01), b_time=1.06(1.03), norm=2.4042634173359274, lr=0.000548611853213362
2023-11-02 19:11:33   INFO  epoch: 13/30, acc_iter=18084, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:08, time_cost(all): 4:59:28/5:46:04, loss=0.455579192119511, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.07(1.03), norm=0.8543094583876636, lr=0.000547008912351194
2023-11-02 19:12:23   INFO  epoch: 13/30, acc_iter=18134, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:06, time_cost(all): 5:00:18/6:15:17, loss=0.455156513566829, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.2(1.03), norm=2.5267442232543904, lr=0.000545405971489025
2023-11-02 19:13:13   INFO  epoch: 13/30, acc_iter=18184, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:29, time_cost(all): 5:01:08/5:51:46, loss=0.454733835014146, d_time=0.00(0.00), f_time=1.1(1.01), b_time=0.86(1.03), norm=2.81609367576041, lr=0.000543803030626857
2023-11-02 19:14:04   INFO  epoch: 13/30, acc_iter=18234, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:49, time_cost(all): 5:01:59/5:49:16, loss=0.454311156461464, d_time=0.00(0.00), f_time=0.96(1.01), b_time=0.84(1.03), norm=2.9005156328745776, lr=0.000542200089764688
2023-11-02 19:14:54   INFO  epoch: 13/30, acc_iter=18284, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:50, time_cost(all): 5:02:49/6:11:15, loss=0.453888477908782, d_time=0.00(0.00), f_time=1.12(1.01), b_time=1.19(1.03), norm=3.860752961209433, lr=0.00054059714890252
2023-11-02 19:15:44   INFO  epoch: 13/30, acc_iter=18334, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:02:00, time_cost(all): 5:03:39/5:54:53, loss=0.453465799356099, d_time=0.00(0.00), f_time=1.16(1.01), b_time=1.03(1.03), norm=3.9725212008825466, lr=0.000538994208040351
2023-11-02 19:16:35   INFO  epoch: 13/30, acc_iter=18384, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:07, time_cost(all): 5:04:30/6:06:13, loss=0.453043120803417, d_time=0.00(0.00), f_time=1.15(1.01), b_time=1.12(1.03), norm=4.734952203980884, lr=0.000537391267178183
2023-11-02 19:17:25   INFO  epoch: 13/30, acc_iter=18434, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:17, time_cost(all): 5:05:20/6:13:10, loss=0.452620442250735, d_time=0.00(0.00), f_time=1.03(1.01), b_time=1.07(1.03), norm=2.610854190485912, lr=0.000535788326316015
2023-11-02 19:18:15   INFO  epoch: 14/30, acc_iter=18502, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:21:38, time_cost(all): 5:06:10/6:05:39, loss=0.452045599419087, d_time=0.00(0.00), f_time=1.14(1.01), b_time=0.92(1.03), norm=1.4890790460234251, lr=0.000533608326743465
2023-11-02 19:19:06   INFO  epoch: 14/30, acc_iter=18552, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:19:45, time_cost(all): 5:07:01/6:12:20, loss=0.451622920866404, d_time=0.00(0.00), f_time=0.94(1.01), b_time=1.02(1.03), norm=1.078724776451541, lr=0.000532005385881297
2023-11-02 19:19:56   INFO  epoch: 14/30, acc_iter=18602, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:19:55, time_cost(all): 5:07:51/5:45:52, loss=0.451200242313722, d_time=0.00(0.00), f_time=1.12(1.01), b_time=0.91(1.03), norm=2.861936028431329, lr=0.000530402445019128
2023-11-02 19:20:46   INFO  epoch: 14/30, acc_iter=18652, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:18:43, time_cost(all): 5:08:41/6:09:10, loss=0.45077756376104, d_time=0.00(0.00), f_time=1.2(1.01), b_time=0.91(1.03), norm=3.7418248775502985, lr=0.00052879950415696
2023-11-02 19:21:37   INFO  epoch: 14/30, acc_iter=18702, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:56, time_cost(all): 5:09:32/5:36:32, loss=0.450354885208358, d_time=0.00(0.00), f_time=1.17(1.01), b_time=0.94(1.03), norm=4.299157006068747, lr=0.000527196563294792
2023-11-02 19:22:27   INFO  epoch: 14/30, acc_iter=18752, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:17:03, time_cost(all): 5:10:22/5:45:10, loss=0.449932206655675, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.1(1.03), norm=0.5771763404326473, lr=0.000525593622432623
2023-11-02 19:23:17   INFO  epoch: 14/30, acc_iter=18802, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:15:29, time_cost(all): 5:11:12/6:00:28, loss=0.449509528102993, d_time=0.00(0.00), f_time=1.18(1.01), b_time=1.18(1.03), norm=1.221239192669891, lr=0.000523990681570455
2023-11-02 19:24:08   INFO  epoch: 14/30, acc_iter=18852, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:38, time_cost(all): 5:12:03/6:02:37, loss=0.449086849550311, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.83(1.03), norm=4.933311656801226, lr=0.000522387740708286
2023-11-02 19:24:58   INFO  epoch: 14/30, acc_iter=18902, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:47, time_cost(all): 5:12:53/6:02:21, loss=0.448664170997628, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.22(1.03), norm=3.0478425408248073, lr=0.000520784799846118
2023-11-02 19:25:48   INFO  epoch: 14/30, acc_iter=18952, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:44, time_cost(all): 5:13:43/5:40:15, loss=0.448241492444946, d_time=0.00(0.00), f_time=1.21(1.01), b_time=1.15(1.03), norm=1.323683641476111, lr=0.000519181858983949
2023-11-02 19:26:39   INFO  epoch: 14/30, acc_iter=19002, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:16, time_cost(all): 5:14:34/6:01:45, loss=0.447818813892264, d_time=0.00(0.00), f_time=1.0(1.01), b_time=1.09(1.03), norm=1.4472914755077388, lr=0.000517578918121781
2023-11-02 19:27:29   INFO  epoch: 14/30, acc_iter=19052, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:16, time_cost(all): 5:15:24/5:41:49, loss=0.447396135339581, d_time=0.00(0.00), f_time=0.94(1.01), b_time=0.89(1.03), norm=3.2983146554582063, lr=0.000515975977259612
2023-11-02 19:28:19   INFO  epoch: 14/30, acc_iter=19102, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:12, time_cost(all): 5:16:14/5:56:00, loss=0.446973456786899, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.09(1.03), norm=2.5778282124667586, lr=0.000514373036397444
2023-11-02 19:29:10   INFO  epoch: 14/30, acc_iter=19152, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:18, time_cost(all): 5:17:05/6:00:07, loss=0.446550778234217, d_time=0.00(0.00), f_time=1.05(1.01), b_time=0.93(1.03), norm=1.608534611496185, lr=0.000512770095535276
2023-11-02 19:30:00   INFO  epoch: 14/30, acc_iter=19202, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:46, time_cost(all): 5:17:55/5:41:13, loss=0.446128099681535, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.93(1.03), norm=2.8263567090469217, lr=0.000511167154673107
2023-11-02 19:30:50   INFO  epoch: 14/30, acc_iter=19252, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:23, time_cost(all): 5:18:45/5:42:10, loss=0.445705421128852, d_time=0.00(0.00), f_time=1.04(1.01), b_time=1.04(1.03), norm=2.5997103707764295, lr=0.000509564213810939
2023-11-02 19:31:41   INFO  epoch: 14/30, acc_iter=19302, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:30, time_cost(all): 5:19:36/5:51:09, loss=0.44528274257617, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.84(1.03), norm=3.463574248083125, lr=0.00050796127294877
2023-11-02 19:32:31   INFO  epoch: 14/30, acc_iter=19352, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:02, time_cost(all): 5:20:26/5:45:05, loss=0.444860064023488, d_time=0.00(0.00), f_time=1.01(1.01), b_time=0.85(1.03), norm=2.831470151490043, lr=0.000506358332086602
2023-11-02 19:33:21   INFO  epoch: 14/30, acc_iter=19402, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:05:54, time_cost(all): 5:21:16/5:52:03, loss=0.444437385470805, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.06(1.03), norm=1.4108019331885353, lr=0.000504755391224433
2023-11-02 19:34:12   INFO  epoch: 14/30, acc_iter=19452, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:31, time_cost(all): 5:22:07/5:46:16, loss=0.444014706918123, d_time=0.00(0.00), f_time=0.95(1.01), b_time=1.22(1.03), norm=4.304215476808773, lr=0.000503152450362265
2023-11-02 19:35:02   INFO  epoch: 14/30, acc_iter=19502, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:31, time_cost(all): 5:22:57/5:54:15, loss=0.443592028365441, d_time=0.00(0.00), f_time=1.12(1.01), b_time=0.97(1.03), norm=3.4418835795083886, lr=0.000501549509500096
2023-11-02 19:35:52   INFO  epoch: 14/30, acc_iter=19552, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:43, time_cost(all): 5:23:47/5:55:47, loss=0.443169349812758, d_time=0.00(0.00), f_time=0.96(1.01), b_time=0.93(1.03), norm=2.129575557267714, lr=0.000499946568637928
2023-11-02 19:36:43   INFO  epoch: 14/30, acc_iter=19602, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:46, time_cost(all): 5:24:38/5:52:43, loss=0.442746671260076, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.11(1.03), norm=2.03786779782118, lr=0.000498343627775759
2023-11-02 19:37:33   INFO  epoch: 14/30, acc_iter=19652, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:57, time_cost(all): 5:25:28/5:24:48, loss=0.442323992707394, d_time=0.00(0.00), f_time=1.17(1.01), b_time=0.89(1.03), norm=4.33619614972602, lr=0.000496740686913591
2023-11-02 19:38:23   INFO  epoch: 14/30, acc_iter=19702, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:08, time_cost(all): 5:26:18/5:45:28, loss=0.441901314154712, d_time=0.00(0.00), f_time=1.12(1.01), b_time=0.89(1.03), norm=2.6032113792739913, lr=0.000495137746051422
2023-11-02 19:39:14   INFO  epoch: 14/30, acc_iter=19752, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:17, time_cost(all): 5:27:09/5:39:12, loss=0.441478635602029, d_time=0.00(0.00), f_time=1.1(1.01), b_time=0.84(1.03), norm=3.4375014001017665, lr=0.000493534805189254
2023-11-02 19:40:04   INFO  epoch: 15/30, acc_iter=19820, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:21:13, time_cost(all): 5:27:59/5:25:48, loss=0.440903792770381, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.07(1.03), norm=2.5227343389828185, lr=0.000491354805616705
2023-11-02 19:40:54   INFO  epoch: 15/30, acc_iter=19870, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:19:50, time_cost(all): 5:28:49/5:19:15, loss=0.440481114217699, d_time=0.00(0.00), f_time=1.11(1.01), b_time=0.93(1.03), norm=0.5490874099261605, lr=0.000489751864754536
2023-11-02 19:41:45   INFO  epoch: 15/30, acc_iter=19920, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:19:55, time_cost(all): 5:29:40/5:25:46, loss=0.440058435665017, d_time=0.00(0.00), f_time=0.97(1.01), b_time=0.99(1.03), norm=1.0716965153904225, lr=0.000488148923892368
2023-11-02 19:42:35   INFO  epoch: 15/30, acc_iter=19970, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:18:21, time_cost(all): 5:30:30/5:48:22, loss=0.439635757112334, d_time=0.00(0.00), f_time=1.02(1.01), b_time=0.9(1.03), norm=1.9655815385820987, lr=0.000486545983030199
2023-11-02 19:43:25   INFO  epoch: 15/30, acc_iter=20020, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:18:04, time_cost(all): 5:31:20/5:25:14, loss=0.439213078559652, d_time=0.00(0.00), f_time=1.15(1.01), b_time=1.23(1.03), norm=3.8322951498909585, lr=0.000484943042168031
2023-11-02 19:44:16   INFO  epoch: 15/30, acc_iter=20070, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:17:35, time_cost(all): 5:32:11/5:30:44, loss=0.43879040000697, d_time=0.00(0.00), f_time=1.16(1.01), b_time=0.93(1.03), norm=0.840626931904634, lr=0.000483340101305863
2023-11-02 19:45:06   INFO  epoch: 15/30, acc_iter=20120, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:17, time_cost(all): 5:33:01/5:25:17, loss=0.438367721454287, d_time=0.00(0.00), f_time=1.1(1.01), b_time=0.88(1.03), norm=1.0454594380068158, lr=0.000481737160443694
2023-11-02 19:45:56   INFO  epoch: 15/30, acc_iter=20170, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:16, time_cost(all): 5:33:51/5:32:48, loss=0.437945042901605, d_time=0.00(0.00), f_time=1.11(1.01), b_time=0.93(1.03), norm=0.8531614145451389, lr=0.000480134219581526
2023-11-02 19:46:47   INFO  epoch: 15/30, acc_iter=20220, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:15:03, time_cost(all): 5:34:42/5:32:57, loss=0.437522364348923, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.13(1.03), norm=2.973499833394759, lr=0.000478531278719357
2023-11-02 19:47:37   INFO  epoch: 15/30, acc_iter=20270, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:14:23, time_cost(all): 5:35:32/5:26:31, loss=0.437099685796241, d_time=0.00(0.00), f_time=1.05(1.01), b_time=0.87(1.03), norm=4.609720919083134, lr=0.000476928337857189
2023-11-02 19:48:27   INFO  epoch: 15/30, acc_iter=20320, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:13:06, time_cost(all): 5:36:22/5:18:43, loss=0.436677007243558, d_time=0.00(0.00), f_time=1.06(1.01), b_time=0.87(1.03), norm=4.6758777781975995, lr=0.00047532539699502
2023-11-02 19:49:18   INFO  epoch: 15/30, acc_iter=20370, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:11:50, time_cost(all): 5:37:13/5:11:47, loss=0.436254328690876, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.19(1.03), norm=3.4362310009563544, lr=0.000473722456132852
2023-11-02 19:50:08   INFO  epoch: 15/30, acc_iter=20420, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:38, time_cost(all): 5:38:03/5:39:31, loss=0.435831650138194, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.14(1.03), norm=4.322291348088631, lr=0.000472119515270683
2023-11-02 19:50:58   INFO  epoch: 15/30, acc_iter=20470, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:24, time_cost(all): 5:38:53/5:20:35, loss=0.435408971585511, d_time=0.00(0.00), f_time=1.1(1.01), b_time=0.96(1.03), norm=3.1087387962046926, lr=0.000470516574408515
2023-11-02 19:51:49   INFO  epoch: 15/30, acc_iter=20520, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:12, time_cost(all): 5:39:44/5:16:23, loss=0.434986293032829, d_time=0.00(0.00), f_time=0.91(1.01), b_time=1.11(1.03), norm=4.449697229493979, lr=0.000468913633546346
2023-11-02 19:52:39   INFO  epoch: 15/30, acc_iter=20570, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:20, time_cost(all): 5:40:34/5:07:37, loss=0.434563614480147, d_time=0.00(0.00), f_time=0.95(1.01), b_time=1.09(1.03), norm=4.981715324178671, lr=0.000467310692684178
2023-11-02 19:53:29   INFO  epoch: 15/30, acc_iter=20620, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:30, time_cost(all): 5:41:24/5:15:03, loss=0.434140935927464, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.18(1.03), norm=3.294831436336759, lr=0.000465707751822009
2023-11-02 19:54:20   INFO  epoch: 15/30, acc_iter=20670, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:18, time_cost(all): 5:42:15/5:33:56, loss=0.433718257374782, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.12(1.03), norm=0.6560442388306116, lr=0.000464104810959841
2023-11-02 19:55:10   INFO  epoch: 15/30, acc_iter=20720, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:28, time_cost(all): 5:43:05/5:30:12, loss=0.4332955788221, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.17(1.03), norm=3.0955668599696624, lr=0.000462501870097673
2023-11-02 19:56:00   INFO  epoch: 15/30, acc_iter=20770, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:25, time_cost(all): 5:43:55/5:07:24, loss=0.432872900269418, d_time=0.00(0.00), f_time=0.99(1.01), b_time=0.94(1.03), norm=1.4050724018711944, lr=0.000460898929235504
2023-11-02 19:56:51   INFO  epoch: 15/30, acc_iter=20820, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:18, time_cost(all): 5:44:46/5:31:27, loss=0.432450221716735, d_time=0.00(0.00), f_time=1.05(1.01), b_time=0.87(1.03), norm=1.0128221234717352, lr=0.000459295988373336
2023-11-02 19:57:41   INFO  epoch: 15/30, acc_iter=20870, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:38, time_cost(all): 5:45:36/5:14:30, loss=0.432027543164053, d_time=0.00(0.00), f_time=1.04(1.01), b_time=1.14(1.03), norm=1.0312577623885435, lr=0.000457693047511167
2023-11-02 19:58:31   INFO  epoch: 15/30, acc_iter=20920, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:55, time_cost(all): 5:46:26/5:14:21, loss=0.431604864611371, d_time=0.00(0.00), f_time=1.15(1.01), b_time=0.98(1.03), norm=0.6079364566813068, lr=0.000456090106648999
2023-11-02 19:59:22   INFO  epoch: 15/30, acc_iter=20970, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:54, time_cost(all): 5:47:17/5:14:22, loss=0.431182186058688, d_time=0.00(0.00), f_time=1.07(1.01), b_time=1.22(1.03), norm=1.8242174381798772, lr=0.00045448716578683
2023-11-02 20:00:12   INFO  epoch: 15/30, acc_iter=21020, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:09, time_cost(all): 5:48:07/5:15:38, loss=0.430759507506006, d_time=0.00(0.00), f_time=1.15(1.01), b_time=0.87(1.03), norm=0.9128705652790261, lr=0.000452884224924662
2023-11-02 20:01:02   INFO  epoch: 15/30, acc_iter=21070, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:17, time_cost(all): 5:48:57/5:15:03, loss=0.430336828953324, d_time=0.00(0.00), f_time=1.19(1.01), b_time=0.86(1.03), norm=4.831369497268344, lr=0.000451281284062493
2023-11-02 20:01:53   INFO  epoch: 16/30, acc_iter=21138, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:21:30, time_cost(all): 5:49:48/5:21:38, loss=0.429761986121676, d_time=0.00(0.00), f_time=0.93(1.01), b_time=1.0(1.03), norm=3.114570234479475, lr=0.000449101284489944
2023-11-02 20:02:43   INFO  epoch: 16/30, acc_iter=21188, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:21:22, time_cost(all): 5:50:38/5:27:10, loss=0.429339307568994, d_time=0.00(0.00), f_time=0.99(1.01), b_time=0.95(1.03), norm=3.783758647578128, lr=0.000447498343627776
2023-11-02 20:03:33   INFO  epoch: 16/30, acc_iter=21238, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:20:25, time_cost(all): 5:51:28/5:10:17, loss=0.428916629016311, d_time=0.00(0.00), f_time=1.12(1.01), b_time=0.93(1.03), norm=3.192947499761321, lr=0.000445895402765607
2023-11-02 20:04:24   INFO  epoch: 16/30, acc_iter=21288, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:19:16, time_cost(all): 5:52:19/4:59:28, loss=0.428493950463629, d_time=0.00(0.00), f_time=0.98(1.01), b_time=1.13(1.03), norm=3.3984788032273414, lr=0.000444292461903439
2023-11-02 20:05:14   INFO  epoch: 16/30, acc_iter=21338, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:18:18, time_cost(all): 5:53:09/5:00:41, loss=0.428071271910947, d_time=0.00(0.00), f_time=1.07(1.01), b_time=1.06(1.03), norm=1.6036073476892267, lr=0.00044268952104127
2023-11-02 20:06:04   INFO  epoch: 16/30, acc_iter=21388, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:16:56, time_cost(all): 5:53:59/5:15:05, loss=0.427648593358264, d_time=0.00(0.00), f_time=1.1(1.01), b_time=1.1(1.03), norm=2.3029262188584676, lr=0.000441086580179102
2023-11-02 20:06:55   INFO  epoch: 16/30, acc_iter=21438, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:48, time_cost(all): 5:54:50/4:57:33, loss=0.427225914805582, d_time=0.00(0.00), f_time=0.93(1.01), b_time=1.2(1.03), norm=4.438307312541369, lr=0.000439483639316934
2023-11-02 20:07:45   INFO  epoch: 16/30, acc_iter=21488, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:34, time_cost(all): 5:55:40/5:22:35, loss=0.4268032362529, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.88(1.03), norm=2.591780357604371, lr=0.000437880698454765
2023-11-02 20:08:35   INFO  epoch: 16/30, acc_iter=21538, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:29, time_cost(all): 5:56:30/4:59:54, loss=0.426380557700217, d_time=0.00(0.00), f_time=0.97(1.01), b_time=0.91(1.03), norm=2.9640463638712125, lr=0.000436277757592597
2023-11-02 20:09:26   INFO  epoch: 16/30, acc_iter=21588, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:36, time_cost(all): 5:57:21/5:18:07, loss=0.425957879147535, d_time=0.00(0.00), f_time=0.94(1.01), b_time=1.05(1.03), norm=2.005091112021467, lr=0.000434674816730428
2023-11-02 20:10:16   INFO  epoch: 16/30, acc_iter=21638, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:57, time_cost(all): 5:58:11/5:10:47, loss=0.425535200594853, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.03(1.03), norm=2.8728258785569754, lr=0.00043307187586826
2023-11-02 20:11:06   INFO  epoch: 16/30, acc_iter=21688, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:11:53, time_cost(all): 5:59:01/4:50:15, loss=0.42511252204217, d_time=0.00(0.00), f_time=0.94(1.01), b_time=1.19(1.03), norm=2.086709161584491, lr=0.000431468935006091
2023-11-02 20:11:57   INFO  epoch: 16/30, acc_iter=21738, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:10:50, time_cost(all): 5:59:52/5:03:51, loss=0.424689843489488, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.21(1.03), norm=3.73141645610922, lr=0.000429865994143923
2023-11-02 20:12:47   INFO  epoch: 16/30, acc_iter=21788, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:40, time_cost(all): 6:00:42/5:05:53, loss=0.424267164936806, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.02(1.03), norm=3.6023048426961073, lr=0.000428263053281754
2023-11-02 20:13:37   INFO  epoch: 16/30, acc_iter=21838, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:52, time_cost(all): 6:01:32/4:58:31, loss=0.423844486384124, d_time=0.00(0.00), f_time=1.01(1.01), b_time=0.86(1.03), norm=2.006305266699867, lr=0.000426660112419586
2023-11-02 20:14:28   INFO  epoch: 16/30, acc_iter=21888, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:09:03, time_cost(all): 6:02:23/4:52:20, loss=0.423421807831441, d_time=0.00(0.00), f_time=0.95(1.01), b_time=0.93(1.03), norm=1.995453107590178, lr=0.000425057171557417
2023-11-02 20:15:18   INFO  epoch: 16/30, acc_iter=21938, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:30, time_cost(all): 6:03:13/5:04:43, loss=0.422999129278759, d_time=0.00(0.00), f_time=0.98(1.01), b_time=0.85(1.03), norm=1.3528646398175035, lr=0.000423454230695249
2023-11-02 20:16:08   INFO  epoch: 16/30, acc_iter=21988, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:06:40, time_cost(all): 6:04:03/4:58:25, loss=0.422576450726077, d_time=0.00(0.00), f_time=0.95(1.01), b_time=0.89(1.03), norm=2.842107712175429, lr=0.00042185128983308
2023-11-02 20:16:59   INFO  epoch: 16/30, acc_iter=22038, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:05:53, time_cost(all): 6:04:54/4:51:13, loss=0.422153772173394, d_time=0.00(0.00), f_time=0.95(1.01), b_time=1.14(1.03), norm=2.7696767567637277, lr=0.000420248348970912
2023-11-02 20:17:49   INFO  epoch: 16/30, acc_iter=22088, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:10, time_cost(all): 6:05:44/5:07:02, loss=0.421731093620712, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.17(1.03), norm=1.0293984939644172, lr=0.000418645408108744
2023-11-02 20:18:39   INFO  epoch: 16/30, acc_iter=22138, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:19, time_cost(all): 6:06:34/4:49:04, loss=0.42130841506803, d_time=0.00(0.00), f_time=1.18(1.01), b_time=1.19(1.03), norm=2.3822359828046666, lr=0.000417042467246575
2023-11-02 20:19:30   INFO  epoch: 16/30, acc_iter=22188, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:48, time_cost(all): 6:07:25/4:55:41, loss=0.420885736515347, d_time=0.00(0.00), f_time=1.15(1.01), b_time=1.04(1.03), norm=2.764230993501721, lr=0.000415439526384407
2023-11-02 20:20:20   INFO  epoch: 16/30, acc_iter=22238, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:52, time_cost(all): 6:08:15/4:45:34, loss=0.420463057962665, d_time=0.00(0.00), f_time=0.96(1.01), b_time=0.94(1.03), norm=1.857962975081367, lr=0.000413836585522238
2023-11-02 20:21:10   INFO  epoch: 16/30, acc_iter=22288, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:54, time_cost(all): 6:09:05/4:43:18, loss=0.420040379409983, d_time=0.00(0.00), f_time=0.92(1.01), b_time=1.01(1.03), norm=4.71763408806367, lr=0.00041223364466007
2023-11-02 20:22:01   INFO  epoch: 16/30, acc_iter=22338, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:05, time_cost(all): 6:09:56/5:00:27, loss=0.419617700857301, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.1(1.03), norm=3.182253504239471, lr=0.000410630703797901
2023-11-02 20:22:51   INFO  epoch: 16/30, acc_iter=22388, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:18, time_cost(all): 6:10:46/4:51:50, loss=0.419195022304618, d_time=0.00(0.00), f_time=1.01(1.01), b_time=0.93(1.03), norm=3.6134062974488166, lr=0.000409027762935733
2023-11-02 20:23:41   INFO  epoch: 17/30, acc_iter=22456, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:21:38, time_cost(all): 6:11:36/5:02:55, loss=0.41862017947297, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.9(1.03), norm=4.8009437587386845, lr=0.000406847763363184
2023-11-02 20:24:32   INFO  epoch: 17/30, acc_iter=22506, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:20:46, time_cost(all): 6:12:27/4:55:31, loss=0.418197500920288, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.98(1.03), norm=3.1834499940806804, lr=0.000405244822501015
2023-11-02 20:25:22   INFO  epoch: 17/30, acc_iter=22556, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:19:41, time_cost(all): 6:13:17/4:38:50, loss=0.417774822367606, d_time=0.00(0.00), f_time=0.98(1.01), b_time=1.15(1.03), norm=1.2410911529149868, lr=0.000403641881638847
2023-11-02 20:26:12   INFO  epoch: 17/30, acc_iter=22606, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:17:57, time_cost(all): 6:14:07/4:58:06, loss=0.417352143814923, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.1(1.03), norm=2.0064293445294745, lr=0.000402038940776678
2023-11-02 20:27:03   INFO  epoch: 17/30, acc_iter=22656, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:09, time_cost(all): 6:14:58/4:39:23, loss=0.416929465262241, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.86(1.03), norm=1.5834632974132612, lr=0.00040043599991451
2023-11-02 20:27:53   INFO  epoch: 17/30, acc_iter=22706, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:16:37, time_cost(all): 6:15:48/4:46:39, loss=0.416506786709559, d_time=0.00(0.00), f_time=0.94(1.01), b_time=1.13(1.03), norm=3.6549832756460963, lr=0.000398833059052341
2023-11-02 20:28:43   INFO  epoch: 17/30, acc_iter=22756, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:15:29, time_cost(all): 6:16:38/4:58:37, loss=0.416084108156876, d_time=0.00(0.00), f_time=1.04(1.01), b_time=0.98(1.03), norm=4.113431743084446, lr=0.000397230118190173
2023-11-02 20:29:34   INFO  epoch: 17/30, acc_iter=22806, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:14:58, time_cost(all): 6:17:29/4:47:37, loss=0.415661429604194, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.15(1.03), norm=2.289085435466714, lr=0.000395627177328004
2023-11-02 20:30:24   INFO  epoch: 17/30, acc_iter=22856, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:46, time_cost(all): 6:18:19/4:54:33, loss=0.415238751051512, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.18(1.03), norm=3.971536338273839, lr=0.000394024236465836
2023-11-02 20:31:14   INFO  epoch: 17/30, acc_iter=22906, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:14:16, time_cost(all): 6:19:09/4:52:41, loss=0.41481607249883, d_time=0.00(0.00), f_time=1.0(1.01), b_time=1.09(1.03), norm=2.8220361862167316, lr=0.000392421295603668
2023-11-02 20:32:05   INFO  epoch: 17/30, acc_iter=22956, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:44, time_cost(all): 6:20:00/4:34:59, loss=0.414393393946147, d_time=0.00(0.00), f_time=1.09(1.01), b_time=1.16(1.03), norm=1.9428059473890509, lr=0.000390818354741499
2023-11-02 20:32:55   INFO  epoch: 17/30, acc_iter=23006, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:12, time_cost(all): 6:20:50/4:49:19, loss=0.413970715393465, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.03(1.03), norm=1.188211813924052, lr=0.000389215413879331
2023-11-02 20:33:45   INFO  epoch: 17/30, acc_iter=23056, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:08, time_cost(all): 6:21:40/4:54:25, loss=0.413548036840783, d_time=0.00(0.00), f_time=1.12(1.01), b_time=0.95(1.03), norm=0.5376115431684336, lr=0.000387612473017162
2023-11-02 20:34:36   INFO  epoch: 17/30, acc_iter=23106, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:17, time_cost(all): 6:22:31/4:38:23, loss=0.4131253582881, d_time=0.00(0.00), f_time=1.04(1.01), b_time=1.14(1.03), norm=2.1436548588707374, lr=0.000386009532154994
2023-11-02 20:35:26   INFO  epoch: 17/30, acc_iter=23156, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:05, time_cost(all): 6:23:21/4:49:38, loss=0.412702679735418, d_time=0.00(0.00), f_time=1.21(1.01), b_time=0.86(1.03), norm=4.349864107120353, lr=0.000384406591292825
2023-11-02 20:36:16   INFO  epoch: 17/30, acc_iter=23206, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:38, time_cost(all): 6:24:11/4:46:53, loss=0.412280001182736, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.21(1.03), norm=3.5253922627541034, lr=0.000382803650430657
2023-11-02 20:37:07   INFO  epoch: 17/30, acc_iter=23256, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:58, time_cost(all): 6:25:02/4:28:12, loss=0.411857322630053, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.2(1.03), norm=2.104619180516649, lr=0.000381200709568488
2023-11-02 20:37:57   INFO  epoch: 17/30, acc_iter=23306, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:19, time_cost(all): 6:25:52/4:33:28, loss=0.411434644077371, d_time=0.00(0.00), f_time=1.18(1.01), b_time=1.02(1.03), norm=1.9585837306748402, lr=0.00037959776870632
2023-11-02 20:38:47   INFO  epoch: 17/30, acc_iter=23356, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:09, time_cost(all): 6:26:42/4:40:18, loss=0.411011965524689, d_time=0.00(0.00), f_time=1.11(1.01), b_time=1.06(1.03), norm=1.910972610463159, lr=0.000377994827844152
2023-11-02 20:39:38   INFO  epoch: 17/30, acc_iter=23406, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:13, time_cost(all): 6:27:33/4:41:42, loss=0.410589286972007, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.17(1.03), norm=3.7841921916931085, lr=0.000376391886981983
2023-11-02 20:40:28   INFO  epoch: 17/30, acc_iter=23456, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:39, time_cost(all): 6:28:23/4:37:22, loss=0.410166608419324, d_time=0.00(0.00), f_time=1.18(1.01), b_time=1.03(1.03), norm=1.822139028760133, lr=0.000374788946119815
2023-11-02 20:41:18   INFO  epoch: 17/30, acc_iter=23506, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:36, time_cost(all): 6:29:13/4:46:59, loss=0.409743929866642, d_time=0.00(0.00), f_time=1.17(1.01), b_time=0.98(1.03), norm=0.553752394862816, lr=0.000373186005257646
2023-11-02 20:42:09   INFO  epoch: 17/30, acc_iter=23556, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:45, time_cost(all): 6:30:04/4:31:05, loss=0.40932125131396, d_time=0.00(0.00), f_time=0.94(1.01), b_time=1.22(1.03), norm=1.323685117563786, lr=0.000371583064395478
2023-11-02 20:42:59   INFO  epoch: 17/30, acc_iter=23606, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:02:02, time_cost(all): 6:30:54/4:40:12, loss=0.408898572761277, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.91(1.03), norm=3.6410518593419634, lr=0.000369980123533309
2023-11-02 20:43:49   INFO  epoch: 17/30, acc_iter=23656, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:11, time_cost(all): 6:31:44/4:19:44, loss=0.408475894208595, d_time=0.00(0.00), f_time=1.06(1.01), b_time=0.92(1.03), norm=4.863363989666688, lr=0.000368377182671141
2023-11-02 20:44:40   INFO  epoch: 17/30, acc_iter=23706, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:18, time_cost(all): 6:32:35/4:36:56, loss=0.408053215655913, d_time=0.00(0.00), f_time=1.0(1.01), b_time=1.07(1.03), norm=1.2100948876246131, lr=0.000366774241808972
2023-11-02 20:45:30   INFO  epoch: 18/30, acc_iter=23774, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:22:19, time_cost(all): 6:33:25/4:35:16, loss=0.407478372824265, d_time=0.00(0.00), f_time=0.94(1.01), b_time=1.05(1.03), norm=4.803151303140756, lr=0.000364594242236423
2023-11-02 20:46:20   INFO  epoch: 18/30, acc_iter=23824, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:21:11, time_cost(all): 6:34:15/4:41:12, loss=0.407055694271583, d_time=0.00(0.00), f_time=1.12(1.01), b_time=1.19(1.03), norm=3.3684354630978848, lr=0.000362991301374255
2023-11-02 20:47:11   INFO  epoch: 18/30, acc_iter=23874, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:18:54, time_cost(all): 6:35:06/4:38:33, loss=0.4066330157189, d_time=0.00(0.00), f_time=1.09(1.01), b_time=1.02(1.03), norm=0.8654941387569924, lr=0.000361388360512086
2023-11-02 20:48:01   INFO  epoch: 18/30, acc_iter=23924, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:18:23, time_cost(all): 6:35:56/4:38:06, loss=0.406210337166218, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.92(1.03), norm=3.3527054916980514, lr=0.000359785419649918
2023-11-02 20:48:51   INFO  epoch: 18/30, acc_iter=23974, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:08, time_cost(all): 6:36:46/4:29:05, loss=0.405787658613536, d_time=0.00(0.00), f_time=1.01(1.01), b_time=1.04(1.03), norm=2.902037310856314, lr=0.000358182478787749
2023-11-02 20:49:42   INFO  epoch: 18/30, acc_iter=24024, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:17:06, time_cost(all): 6:37:37/4:23:45, loss=0.405364980060853, d_time=0.00(0.00), f_time=1.12(1.01), b_time=0.84(1.03), norm=1.1036956026849245, lr=0.000356579537925581
2023-11-02 20:50:32   INFO  epoch: 18/30, acc_iter=24074, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:05, time_cost(all): 6:38:27/4:25:11, loss=0.404942301508171, d_time=0.00(0.00), f_time=1.07(1.01), b_time=1.07(1.03), norm=2.5795038418293204, lr=0.000354976597063412
2023-11-02 20:51:22   INFO  epoch: 18/30, acc_iter=24124, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:51, time_cost(all): 6:39:17/4:20:47, loss=0.404519622955489, d_time=0.00(0.00), f_time=1.09(1.01), b_time=1.06(1.03), norm=4.478321610924471, lr=0.000353373656201244
2023-11-02 20:52:13   INFO  epoch: 18/30, acc_iter=24174, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:11, time_cost(all): 6:40:08/4:31:26, loss=0.404096944402806, d_time=0.00(0.00), f_time=1.03(1.01), b_time=1.03(1.03), norm=3.1704819463092586, lr=0.000351770715339076
2023-11-02 20:53:03   INFO  epoch: 18/30, acc_iter=24224, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:48, time_cost(all): 6:40:58/4:15:58, loss=0.403674265850124, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.88(1.03), norm=1.277787697968194, lr=0.000350167774476907
2023-11-02 20:53:53   INFO  epoch: 18/30, acc_iter=24274, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:13:01, time_cost(all): 6:41:48/4:22:53, loss=0.403251587297442, d_time=0.00(0.00), f_time=1.04(1.01), b_time=0.93(1.03), norm=3.253657476318623, lr=0.000348564833614739
2023-11-02 20:54:44   INFO  epoch: 18/30, acc_iter=24324, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:11:47, time_cost(all): 6:42:39/4:17:26, loss=0.402828908744759, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.2(1.03), norm=2.9119054011621612, lr=0.00034696189275257
2023-11-02 20:55:34   INFO  epoch: 18/30, acc_iter=24374, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:44, time_cost(all): 6:43:29/4:18:54, loss=0.402406230192077, d_time=0.00(0.00), f_time=1.09(1.01), b_time=1.07(1.03), norm=0.8014525733316162, lr=0.000345358951890402
2023-11-02 20:56:24   INFO  epoch: 18/30, acc_iter=24424, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:09:52, time_cost(all): 6:44:19/4:17:23, loss=0.401983551639395, d_time=0.00(0.00), f_time=1.07(1.01), b_time=0.92(1.03), norm=1.1806916461069041, lr=0.000343756011028233
2023-11-02 20:57:15   INFO  epoch: 18/30, acc_iter=24474, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:19, time_cost(all): 6:45:10/4:23:03, loss=0.401560873086713, d_time=0.00(0.00), f_time=1.13(1.01), b_time=0.97(1.03), norm=3.503403627694481, lr=0.000342153070166065
2023-11-02 20:58:05   INFO  epoch: 18/30, acc_iter=24524, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:44, time_cost(all): 6:46:00/4:19:20, loss=0.40113819453403, d_time=0.00(0.00), f_time=1.16(1.01), b_time=1.12(1.03), norm=2.7904997522312716, lr=0.000340550129303896
2023-11-02 20:58:55   INFO  epoch: 18/30, acc_iter=24574, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:38, time_cost(all): 6:46:50/4:26:56, loss=0.400715515981348, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.06(1.03), norm=2.142457918223007, lr=0.000338947188441728
2023-11-02 20:59:46   INFO  epoch: 18/30, acc_iter=24624, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:06:42, time_cost(all): 6:47:41/4:04:58, loss=0.400292837428666, d_time=0.00(0.00), f_time=1.08(1.01), b_time=0.84(1.03), norm=2.442388388745613, lr=0.000337344247579559
2023-11-02 21:00:36   INFO  epoch: 18/30, acc_iter=24674, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:08, time_cost(all): 6:48:31/4:06:17, loss=0.399870158875983, d_time=0.00(0.00), f_time=0.94(1.01), b_time=0.88(1.03), norm=2.161848655698548, lr=0.000335741306717391
2023-11-02 21:01:26   INFO  epoch: 18/30, acc_iter=24724, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:21, time_cost(all): 6:49:21/4:08:39, loss=0.399447480323301, d_time=0.00(0.00), f_time=1.05(1.01), b_time=0.98(1.03), norm=1.911128280916482, lr=0.000334138365855223
2023-11-02 21:02:17   INFO  epoch: 18/30, acc_iter=24774, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:29, time_cost(all): 6:50:12/4:24:29, loss=0.399024801770619, d_time=0.00(0.00), f_time=1.2(1.01), b_time=1.07(1.03), norm=3.0048672866684023, lr=0.000332535424993054
2023-11-02 21:03:07   INFO  epoch: 18/30, acc_iter=24824, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:32, time_cost(all): 6:51:02/4:04:31, loss=0.398602123217936, d_time=0.00(0.00), f_time=1.18(1.01), b_time=1.04(1.03), norm=1.7259726458345335, lr=0.000330932484130885
2023-11-02 21:03:57   INFO  epoch: 18/30, acc_iter=24874, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:56, time_cost(all): 6:51:52/4:02:42, loss=0.398179444665254, d_time=0.00(0.00), f_time=1.11(1.01), b_time=0.95(1.03), norm=3.9342676981053066, lr=0.000329329543268717
2023-11-02 21:04:48   INFO  epoch: 18/30, acc_iter=24924, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:53, time_cost(all): 6:52:43/4:13:01, loss=0.397756766112572, d_time=0.00(0.00), f_time=0.98(1.01), b_time=0.84(1.03), norm=3.004595413771264, lr=0.000327726602406549
2023-11-02 21:05:38   INFO  epoch: 18/30, acc_iter=24974, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:10, time_cost(all): 6:53:33/4:15:51, loss=0.39733408755989, d_time=0.00(0.00), f_time=1.15(1.01), b_time=0.99(1.03), norm=1.4882601666320896, lr=0.00032612366154438
2023-11-02 21:06:28   INFO  epoch: 18/30, acc_iter=25024, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:17, time_cost(all): 6:54:23/4:04:20, loss=0.396911409007207, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.12(1.03), norm=2.160348941111267, lr=0.000324520720682212
2023-11-02 21:07:18   INFO  epoch: 19/30, acc_iter=25092, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:22:04, time_cost(all): 6:55:13/4:17:48, loss=0.396336566175559, d_time=0.00(0.00), f_time=1.11(1.01), b_time=1.1(1.03), norm=3.4910348654117485, lr=0.000322340721109663
2023-11-02 21:08:09   INFO  epoch: 19/30, acc_iter=25142, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:20:09, time_cost(all): 6:56:04/4:19:07, loss=0.395913887622877, d_time=0.00(0.00), f_time=0.98(1.01), b_time=0.87(1.03), norm=1.6152466815364521, lr=0.000320737780247494
2023-11-02 21:08:59   INFO  epoch: 19/30, acc_iter=25192, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:18:47, time_cost(all): 6:56:54/4:02:29, loss=0.395491209070195, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.84(1.03), norm=1.122519104745929, lr=0.000319134839385326
2023-11-02 21:09:49   INFO  epoch: 19/30, acc_iter=25242, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:17:57, time_cost(all): 6:57:44/4:17:40, loss=0.395068530517512, d_time=0.00(0.00), f_time=0.93(1.01), b_time=1.14(1.03), norm=0.8378828187541374, lr=0.000317531898523157
2023-11-02 21:10:40   INFO  epoch: 19/30, acc_iter=25292, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:51, time_cost(all): 6:58:35/3:52:38, loss=0.39464585196483, d_time=0.00(0.00), f_time=0.99(1.01), b_time=0.98(1.03), norm=3.6957380234527477, lr=0.000315928957660989
2023-11-02 21:11:30   INFO  epoch: 19/30, acc_iter=25342, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:16:32, time_cost(all): 6:59:25/4:09:49, loss=0.394223173412148, d_time=0.00(0.00), f_time=1.1(1.01), b_time=0.85(1.03), norm=4.343271764123682, lr=0.00031432601679882
2023-11-02 21:12:20   INFO  epoch: 19/30, acc_iter=25392, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:25, time_cost(all): 7:00:15/3:52:30, loss=0.393800494859465, d_time=0.00(0.00), f_time=1.11(1.01), b_time=1.04(1.03), norm=2.4980397689942464, lr=0.000312723075936652
2023-11-02 21:13:11   INFO  epoch: 19/30, acc_iter=25442, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:22, time_cost(all): 7:01:06/4:11:16, loss=0.393377816306783, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.1(1.03), norm=4.354374470198982, lr=0.000311120135074483
2023-11-02 21:14:01   INFO  epoch: 19/30, acc_iter=25492, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:00, time_cost(all): 7:01:56/4:06:53, loss=0.392955137754101, d_time=0.00(0.00), f_time=1.2(1.01), b_time=0.96(1.03), norm=3.9622330481752086, lr=0.000309517194212315
2023-11-02 21:14:51   INFO  epoch: 19/30, acc_iter=25542, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:14:03, time_cost(all): 7:02:46/3:49:16, loss=0.392532459201419, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.18(1.03), norm=1.7400215352462343, lr=0.000307914253350146
2023-11-02 21:15:42   INFO  epoch: 19/30, acc_iter=25592, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:16, time_cost(all): 7:03:37/3:55:10, loss=0.392109780648736, d_time=0.00(0.00), f_time=1.15(1.01), b_time=0.94(1.03), norm=1.6038544378633022, lr=0.000306311312487978
2023-11-02 21:16:32   INFO  epoch: 19/30, acc_iter=25642, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:29, time_cost(all): 7:04:27/4:04:52, loss=0.391687102096054, d_time=0.00(0.00), f_time=1.15(1.01), b_time=0.97(1.03), norm=2.1949694013569307, lr=0.00030470837162581
2023-11-02 21:17:22   INFO  epoch: 19/30, acc_iter=25692, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:28, time_cost(all): 7:05:17/4:07:16, loss=0.391264423543372, d_time=0.00(0.00), f_time=1.13(1.01), b_time=0.96(1.03), norm=3.412075288300221, lr=0.000303105430763641
2023-11-02 21:18:13   INFO  epoch: 19/30, acc_iter=25742, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:01, time_cost(all): 7:06:08/3:47:44, loss=0.390841744990689, d_time=0.00(0.00), f_time=0.95(1.01), b_time=1.12(1.03), norm=4.51530243501563, lr=0.000301502489901473
2023-11-02 21:19:03   INFO  epoch: 19/30, acc_iter=25792, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:15, time_cost(all): 7:06:58/4:07:16, loss=0.390419066438007, d_time=0.00(0.00), f_time=0.96(1.01), b_time=0.96(1.03), norm=1.7034414653606451, lr=0.000299899549039304
2023-11-02 21:19:53   INFO  epoch: 19/30, acc_iter=25842, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:40, time_cost(all): 7:07:48/3:57:03, loss=0.389996387885325, d_time=0.00(0.00), f_time=0.93(1.01), b_time=0.99(1.03), norm=1.2344621270924576, lr=0.000298296608177136
2023-11-02 21:20:44   INFO  epoch: 19/30, acc_iter=25892, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:31, time_cost(all): 7:08:39/4:05:35, loss=0.389573709332642, d_time=0.00(0.00), f_time=1.15(1.01), b_time=1.03(1.03), norm=2.9840671663798872, lr=0.000296693667314967
2023-11-02 21:21:34   INFO  epoch: 19/30, acc_iter=25942, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:06:59, time_cost(all): 7:09:29/3:47:16, loss=0.38915103077996, d_time=0.00(0.00), f_time=1.14(1.01), b_time=0.92(1.03), norm=1.6333079338756544, lr=0.000295090726452799
2023-11-02 21:22:24   INFO  epoch: 19/30, acc_iter=25992, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:05, time_cost(all): 7:10:19/3:41:22, loss=0.388728352227278, d_time=0.00(0.00), f_time=0.95(1.01), b_time=0.96(1.03), norm=3.434781779541959, lr=0.00029348778559063
2023-11-02 21:23:15   INFO  epoch: 19/30, acc_iter=26042, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:09, time_cost(all): 7:11:10/4:02:12, loss=0.388305673674596, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.0(1.03), norm=1.1376437879633765, lr=0.000291884844728462
2023-11-02 21:24:05   INFO  epoch: 19/30, acc_iter=26092, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:28, time_cost(all): 7:12:00/3:48:25, loss=0.387882995121913, d_time=0.00(0.00), f_time=0.96(1.01), b_time=0.9(1.03), norm=4.031071485694171, lr=0.000290281903866293
2023-11-02 21:24:55   INFO  epoch: 19/30, acc_iter=26142, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:45, time_cost(all): 7:12:50/3:44:25, loss=0.387460316569231, d_time=0.00(0.00), f_time=1.19(1.01), b_time=0.89(1.03), norm=2.598264942214102, lr=0.000288678963004125
2023-11-02 21:25:46   INFO  epoch: 19/30, acc_iter=26192, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:45, time_cost(all): 7:13:41/3:41:45, loss=0.387037638016549, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.13(1.03), norm=3.323689007091309, lr=0.000287076022141957
2023-11-02 21:26:36   INFO  epoch: 19/30, acc_iter=26242, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:58, time_cost(all): 7:14:31/3:55:17, loss=0.386614959463866, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.13(1.03), norm=1.0817162686570083, lr=0.000285473081279788
2023-11-02 21:27:26   INFO  epoch: 19/30, acc_iter=26292, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:08, time_cost(all): 7:15:21/3:55:22, loss=0.386192280911184, d_time=0.00(0.00), f_time=1.14(1.01), b_time=0.84(1.03), norm=2.6711819512617625, lr=0.00028387014041762
2023-11-02 21:28:17   INFO  epoch: 19/30, acc_iter=26342, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:17, time_cost(all): 7:16:12/3:51:46, loss=0.385769602358502, d_time=0.00(0.00), f_time=1.04(1.01), b_time=1.06(1.03), norm=4.306512591517703, lr=0.000282267199555451
2023-11-02 21:29:07   INFO  epoch: 20/30, acc_iter=26410, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:20:47, time_cost(all): 7:17:02/3:56:08, loss=0.385194759526854, d_time=0.00(0.00), f_time=1.02(1.01), b_time=0.93(1.03), norm=1.5554110769281284, lr=0.000280087199982902
2023-11-02 21:29:57   INFO  epoch: 20/30, acc_iter=26460, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:20:05, time_cost(all): 7:17:52/3:44:59, loss=0.384772080974171, d_time=0.00(0.00), f_time=1.07(1.01), b_time=0.93(1.03), norm=1.139018565129208, lr=0.000278484259120734
2023-11-02 21:30:48   INFO  epoch: 20/30, acc_iter=26510, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:20:16, time_cost(all): 7:18:43/3:49:02, loss=0.384349402421489, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.22(1.03), norm=4.819485808803716, lr=0.000276881318258565
2023-11-02 21:31:38   INFO  epoch: 20/30, acc_iter=26560, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:19:17, time_cost(all): 7:19:33/3:40:56, loss=0.383926723868807, d_time=0.00(0.00), f_time=1.18(1.01), b_time=0.94(1.03), norm=2.012483765908991, lr=0.000275278377396397
2023-11-02 21:32:28   INFO  epoch: 20/30, acc_iter=26610, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:09, time_cost(all): 7:20:23/3:37:34, loss=0.383504045316125, d_time=0.00(0.00), f_time=1.07(1.01), b_time=1.16(1.03), norm=3.369666242447298, lr=0.000273675436534228
2023-11-02 21:33:19   INFO  epoch: 20/30, acc_iter=26660, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:17:49, time_cost(all): 7:21:14/3:32:41, loss=0.383081366763442, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.04(1.03), norm=3.376064214754066, lr=0.00027207249567206
2023-11-02 21:34:09   INFO  epoch: 20/30, acc_iter=26710, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:40, time_cost(all): 7:22:04/3:36:44, loss=0.38265868821076, d_time=0.00(0.00), f_time=0.92(1.01), b_time=1.2(1.03), norm=2.437383677542096, lr=0.000270469554809891
2023-11-02 21:34:59   INFO  epoch: 20/30, acc_iter=26760, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:14:39, time_cost(all): 7:22:54/3:41:40, loss=0.382236009658078, d_time=0.00(0.00), f_time=1.1(1.01), b_time=0.97(1.03), norm=3.3989174588200677, lr=0.000268866613947723
2023-11-02 21:35:50   INFO  epoch: 20/30, acc_iter=26810, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:12, time_cost(all): 7:23:45/3:33:09, loss=0.381813331105395, d_time=0.00(0.00), f_time=1.18(1.01), b_time=1.04(1.03), norm=2.1448960689010472, lr=0.000267263673085554
2023-11-02 21:36:40   INFO  epoch: 20/30, acc_iter=26860, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:23, time_cost(all): 7:24:35/3:38:59, loss=0.381390652552713, d_time=0.00(0.00), f_time=1.15(1.01), b_time=0.9(1.03), norm=1.7912522530284474, lr=0.000265660732223386
2023-11-02 21:37:30   INFO  epoch: 20/30, acc_iter=26910, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:19, time_cost(all): 7:25:25/3:40:38, loss=0.380967974000031, d_time=0.00(0.00), f_time=1.19(1.01), b_time=0.89(1.03), norm=3.174925767323805, lr=0.000264057791361217
2023-11-02 21:38:21   INFO  epoch: 20/30, acc_iter=26960, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:11:36, time_cost(all): 7:26:16/3:34:02, loss=0.380545295447348, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.18(1.03), norm=4.036141529684965, lr=0.000262454850499049
2023-11-02 21:39:11   INFO  epoch: 20/30, acc_iter=27010, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:34, time_cost(all): 7:27:06/3:36:39, loss=0.380122616894666, d_time=0.00(0.00), f_time=0.94(1.01), b_time=1.03(1.03), norm=0.7602580908000647, lr=0.000260851909636881
2023-11-02 21:40:01   INFO  epoch: 20/30, acc_iter=27060, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:40, time_cost(all): 7:27:56/3:45:11, loss=0.379699938341984, d_time=0.00(0.00), f_time=1.04(1.01), b_time=1.13(1.03), norm=1.3827666399298681, lr=0.000259248968774712
2023-11-02 21:40:52   INFO  epoch: 20/30, acc_iter=27110, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:46, time_cost(all): 7:28:47/3:31:25, loss=0.379277259789302, d_time=0.00(0.00), f_time=1.2(1.01), b_time=1.17(1.03), norm=4.6539536948854545, lr=0.000257646027912544
2023-11-02 21:41:42   INFO  epoch: 20/30, acc_iter=27160, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:41, time_cost(all): 7:29:37/3:31:51, loss=0.378854581236619, d_time=0.00(0.00), f_time=1.11(1.01), b_time=1.05(1.03), norm=4.208313446584301, lr=0.000256043087050375
2023-11-02 21:42:32   INFO  epoch: 20/30, acc_iter=27210, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:54, time_cost(all): 7:30:27/3:40:50, loss=0.378431902683937, d_time=0.00(0.00), f_time=0.92(1.01), b_time=0.91(1.03), norm=2.6735237486306396, lr=0.000254440146188207
2023-11-02 21:43:23   INFO  epoch: 20/30, acc_iter=27260, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:06:55, time_cost(all): 7:31:18/3:41:13, loss=0.378009224131255, d_time=0.00(0.00), f_time=1.04(1.01), b_time=1.07(1.03), norm=3.9554204993803355, lr=0.000252837205326038
2023-11-02 21:44:13   INFO  epoch: 20/30, acc_iter=27310, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:16, time_cost(all): 7:32:08/3:38:13, loss=0.377586545578572, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.05(1.03), norm=2.5941638836058, lr=0.00025123426446387
2023-11-02 21:45:03   INFO  epoch: 20/30, acc_iter=27360, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:07, time_cost(all): 7:32:58/3:31:13, loss=0.37716386702589, d_time=0.00(0.00), f_time=0.93(1.01), b_time=0.86(1.03), norm=3.0062139230976372, lr=0.000249631323601701
2023-11-02 21:45:54   INFO  epoch: 20/30, acc_iter=27410, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:40, time_cost(all): 7:33:49/3:19:17, loss=0.376741188473208, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.02(1.03), norm=4.3335776733266, lr=0.000248028382739533
2023-11-02 21:46:44   INFO  epoch: 20/30, acc_iter=27460, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:35, time_cost(all): 7:34:39/3:30:13, loss=0.376318509920525, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.17(1.03), norm=4.710820961232667, lr=0.000246425441877364
2023-11-02 21:47:34   INFO  epoch: 20/30, acc_iter=27510, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:50, time_cost(all): 7:35:29/3:35:00, loss=0.375895831367843, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.14(1.03), norm=0.518958421491444, lr=0.000244822501015196
2023-11-02 21:48:25   INFO  epoch: 20/30, acc_iter=27560, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:58, time_cost(all): 7:36:20/3:32:38, loss=0.375473152815161, d_time=0.00(0.00), f_time=1.01(1.01), b_time=0.97(1.03), norm=3.371226076405685, lr=0.000243219560153028
2023-11-02 21:49:15   INFO  epoch: 20/30, acc_iter=27610, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:07, time_cost(all): 7:37:10/3:19:50, loss=0.375050474262479, d_time=0.00(0.00), f_time=1.18(1.01), b_time=0.88(1.03), norm=2.3102164778427787, lr=0.000241616619290859
2023-11-02 21:50:05   INFO  epoch: 20/30, acc_iter=27660, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:17, time_cost(all): 7:38:00/3:28:26, loss=0.374627795709796, d_time=0.00(0.00), f_time=1.05(1.01), b_time=0.91(1.03), norm=2.3742035816950495, lr=0.000240013678428691
2023-11-02 21:50:56   INFO  epoch: 21/30, acc_iter=27728, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:22:09, time_cost(all): 7:38:51/3:31:30, loss=0.374052952878148, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.17(1.03), norm=2.5005584389422957, lr=0.000237833678856141
2023-11-02 21:51:46   INFO  epoch: 21/30, acc_iter=27778, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:20:38, time_cost(all): 7:39:41/3:22:23, loss=0.373630274325466, d_time=0.00(0.00), f_time=1.12(1.01), b_time=1.12(1.03), norm=3.093171565910232, lr=0.000236230737993973
2023-11-02 21:52:36   INFO  epoch: 21/30, acc_iter=27828, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:19:07, time_cost(all): 7:40:31/3:23:07, loss=0.373207595772784, d_time=0.00(0.00), f_time=1.21(1.01), b_time=1.17(1.03), norm=3.3484569094027083, lr=0.000234627797131805
2023-11-02 21:53:27   INFO  epoch: 21/30, acc_iter=27878, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:19:11, time_cost(all): 7:41:22/3:23:54, loss=0.372784917220101, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.06(1.03), norm=1.9398694284479197, lr=0.000233024856269636
2023-11-02 21:54:17   INFO  epoch: 21/30, acc_iter=27928, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:12, time_cost(all): 7:42:12/3:12:00, loss=0.372362238667419, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.03(1.03), norm=4.273080335729449, lr=0.000231421915407468
2023-11-02 21:55:07   INFO  epoch: 21/30, acc_iter=27978, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:16:21, time_cost(all): 7:43:02/3:20:53, loss=0.371939560114737, d_time=0.00(0.00), f_time=1.17(1.01), b_time=0.91(1.03), norm=3.341205891138485, lr=0.000229818974545299
2023-11-02 21:55:58   INFO  epoch: 21/30, acc_iter=28028, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:25, time_cost(all): 7:43:53/3:16:47, loss=0.371516881562054, d_time=0.00(0.00), f_time=0.92(1.01), b_time=1.19(1.03), norm=4.262339103803507, lr=0.000228216033683131
2023-11-02 21:56:48   INFO  epoch: 21/30, acc_iter=28078, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:14:48, time_cost(all): 7:44:43/3:09:41, loss=0.371094203009372, d_time=0.00(0.00), f_time=0.92(1.01), b_time=1.0(1.03), norm=0.6738921436503733, lr=0.000226613092820962
2023-11-02 21:57:38   INFO  epoch: 21/30, acc_iter=28128, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:12, time_cost(all): 7:45:33/3:12:21, loss=0.37067152445669, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.06(1.03), norm=2.01957221795863, lr=0.000225010151958794
2023-11-02 21:58:29   INFO  epoch: 21/30, acc_iter=28178, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:14:00, time_cost(all): 7:46:24/3:07:24, loss=0.370248845904008, d_time=0.00(0.00), f_time=1.09(1.01), b_time=1.2(1.03), norm=2.034779294264196, lr=0.000223407211096625
2023-11-02 21:59:19   INFO  epoch: 21/30, acc_iter=28228, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:17, time_cost(all): 7:47:14/3:21:32, loss=0.369826167351325, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.91(1.03), norm=3.7538751042196195, lr=0.000221804270234457
2023-11-02 22:00:09   INFO  epoch: 21/30, acc_iter=28278, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:22, time_cost(all): 7:48:04/3:06:51, loss=0.369403488798643, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.15(1.03), norm=4.3542947106261565, lr=0.000220201329372289
2023-11-02 22:01:00   INFO  epoch: 21/30, acc_iter=28328, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:00, time_cost(all): 7:48:55/3:07:33, loss=0.368980810245961, d_time=0.00(0.00), f_time=1.21(1.01), b_time=1.19(1.03), norm=4.8484334223196806, lr=0.00021859838851012
2023-11-02 22:01:50   INFO  epoch: 21/30, acc_iter=28378, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:29, time_cost(all): 7:49:45/3:12:06, loss=0.368558131693278, d_time=0.00(0.00), f_time=1.08(1.01), b_time=0.93(1.03), norm=2.258980429977, lr=0.000216995447647951
2023-11-02 22:02:40   INFO  epoch: 21/30, acc_iter=28428, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:31, time_cost(all): 7:50:35/3:14:23, loss=0.368135453140596, d_time=0.00(0.00), f_time=1.2(1.01), b_time=0.91(1.03), norm=1.9555266700750265, lr=0.000215392506785783
2023-11-02 22:03:31   INFO  epoch: 21/30, acc_iter=28478, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:57, time_cost(all): 7:51:26/3:14:42, loss=0.367712774587914, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.13(1.03), norm=3.69741068958755, lr=0.000213789565923615
2023-11-02 22:04:21   INFO  epoch: 21/30, acc_iter=28528, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:31, time_cost(all): 7:52:16/3:12:26, loss=0.367290096035231, d_time=0.00(0.00), f_time=0.97(1.01), b_time=0.86(1.03), norm=4.606768605591838, lr=0.000212186625061446
2023-11-02 22:05:11   INFO  epoch: 21/30, acc_iter=28578, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:06:51, time_cost(all): 7:53:06/3:08:20, loss=0.366867417482549, d_time=0.00(0.00), f_time=1.09(1.01), b_time=1.1(1.03), norm=4.208895448146846, lr=0.000210583684199278
2023-11-02 22:06:02   INFO  epoch: 21/30, acc_iter=28628, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:05:59, time_cost(all): 7:53:57/3:17:52, loss=0.366444738929867, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.21(1.03), norm=0.7951604994596139, lr=0.000208980743337109
2023-11-02 22:06:52   INFO  epoch: 21/30, acc_iter=28678, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:07, time_cost(all): 7:54:47/3:11:40, loss=0.366022060377185, d_time=0.00(0.00), f_time=1.01(1.01), b_time=0.87(1.03), norm=1.7092951193475645, lr=0.000207377802474941
2023-11-02 22:07:42   INFO  epoch: 21/30, acc_iter=28728, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:36, time_cost(all): 7:55:37/3:10:14, loss=0.365599381824502, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.18(1.03), norm=3.9726423685831964, lr=0.000205774861612772
2023-11-02 22:08:33   INFO  epoch: 21/30, acc_iter=28778, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:44, time_cost(all): 7:56:28/3:04:45, loss=0.36517670327182, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.0(1.03), norm=3.1788620223509803, lr=0.000204171920750604
2023-11-02 22:09:23   INFO  epoch: 21/30, acc_iter=28828, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:41, time_cost(all): 7:57:18/3:07:30, loss=0.364754024719138, d_time=0.00(0.00), f_time=1.2(1.01), b_time=1.21(1.03), norm=2.375475445082713, lr=0.000202568979888435
2023-11-02 22:10:13   INFO  epoch: 21/30, acc_iter=28878, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:57, time_cost(all): 7:58:08/2:57:02, loss=0.364331346166455, d_time=0.00(0.00), f_time=1.08(1.01), b_time=0.84(1.03), norm=1.6743830997668985, lr=0.000200966039026267
2023-11-02 22:11:04   INFO  epoch: 21/30, acc_iter=28928, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:09, time_cost(all): 7:58:59/3:05:24, loss=0.363908667613773, d_time=0.00(0.00), f_time=0.91(1.01), b_time=1.13(1.03), norm=2.2728287244489653, lr=0.000199363098164098
2023-11-02 22:11:54   INFO  epoch: 21/30, acc_iter=28978, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:17, time_cost(all): 7:59:49/2:58:18, loss=0.363485989061091, d_time=0.00(0.00), f_time=1.2(1.01), b_time=1.17(1.03), norm=0.8593244187485964, lr=0.00019776015730193
2023-11-02 22:12:44   INFO  epoch: 22/30, acc_iter=29046, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:21:50, time_cost(all): 8:00:39/2:55:10, loss=0.362911146229443, d_time=0.00(0.00), f_time=1.04(1.01), b_time=0.97(1.03), norm=3.374779373979947, lr=0.000195580157729381
2023-11-02 22:13:35   INFO  epoch: 22/30, acc_iter=29096, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:19:27, time_cost(all): 8:01:30/3:07:15, loss=0.36248846767676, d_time=0.00(0.00), f_time=1.15(1.01), b_time=1.17(1.03), norm=2.3018744065042, lr=0.000193977216867212
2023-11-02 22:14:25   INFO  epoch: 22/30, acc_iter=29146, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:18:58, time_cost(all): 8:02:20/3:03:18, loss=0.362065789124078, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.11(1.03), norm=1.6354641604488305, lr=0.000192374276005044
2023-11-02 22:15:15   INFO  epoch: 22/30, acc_iter=29196, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:18:58, time_cost(all): 8:03:10/2:54:38, loss=0.361643110571396, d_time=0.00(0.00), f_time=1.17(1.01), b_time=0.84(1.03), norm=4.595924497960838, lr=0.000190771335142876
2023-11-02 22:16:06   INFO  epoch: 22/30, acc_iter=29246, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:06, time_cost(all): 8:04:01/2:57:56, loss=0.361220432018714, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.85(1.03), norm=1.4882910048008813, lr=0.000189168394280707
2023-11-02 22:16:56   INFO  epoch: 22/30, acc_iter=29296, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:16:57, time_cost(all): 8:04:51/2:56:56, loss=0.360797753466031, d_time=0.00(0.00), f_time=0.93(1.01), b_time=1.13(1.03), norm=1.7361819350548438, lr=0.000187565453418539
2023-11-02 22:17:46   INFO  epoch: 22/30, acc_iter=29346, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:22, time_cost(all): 8:05:41/2:50:46, loss=0.360375074913349, d_time=0.00(0.00), f_time=0.97(1.01), b_time=0.86(1.03), norm=0.7666680446261032, lr=0.00018596251255637
2023-11-02 22:18:37   INFO  epoch: 22/30, acc_iter=29396, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:10, time_cost(all): 8:06:32/2:52:01, loss=0.359952396360667, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.16(1.03), norm=0.7210826716494856, lr=0.000184359571694202
2023-11-02 22:19:27   INFO  epoch: 22/30, acc_iter=29446, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:15:08, time_cost(all): 8:07:22/2:51:04, loss=0.359529717807984, d_time=0.00(0.00), f_time=1.08(1.01), b_time=0.85(1.03), norm=1.6842515883367297, lr=0.000182756630832033
2023-11-02 22:20:17   INFO  epoch: 22/30, acc_iter=29496, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:42, time_cost(all): 8:08:12/3:02:48, loss=0.359107039255302, d_time=0.00(0.00), f_time=1.15(1.01), b_time=1.03(1.03), norm=4.408033019532708, lr=0.000181153689969865
2023-11-02 22:21:08   INFO  epoch: 22/30, acc_iter=29546, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:13:18, time_cost(all): 8:09:03/2:45:41, loss=0.35868436070262, d_time=0.00(0.00), f_time=1.07(1.01), b_time=0.85(1.03), norm=1.056348314784076, lr=0.000179550749107696
2023-11-02 22:21:58   INFO  epoch: 22/30, acc_iter=29596, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:11:44, time_cost(all): 8:09:53/2:46:52, loss=0.358261682149937, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.16(1.03), norm=3.171667482328693, lr=0.000177947808245528
2023-11-02 22:22:48   INFO  epoch: 22/30, acc_iter=29646, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:10:47, time_cost(all): 8:10:43/2:49:01, loss=0.357839003597255, d_time=0.00(0.00), f_time=0.98(1.01), b_time=0.99(1.03), norm=3.126181965982761, lr=0.000176344867383359
2023-11-02 22:23:39   INFO  epoch: 22/30, acc_iter=29696, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:07, time_cost(all): 8:11:34/2:58:46, loss=0.357416325044573, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.17(1.03), norm=2.767852112552357, lr=0.000174741926521191
2023-11-02 22:24:29   INFO  epoch: 22/30, acc_iter=29746, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:19, time_cost(all): 8:12:24/2:46:27, loss=0.356993646491891, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.02(1.03), norm=3.4931365920353747, lr=0.000173138985659022
2023-11-02 22:25:19   INFO  epoch: 22/30, acc_iter=29796, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:52, time_cost(all): 8:13:14/2:58:27, loss=0.356570967939208, d_time=0.00(0.00), f_time=0.96(1.01), b_time=1.23(1.03), norm=3.1389332822269713, lr=0.000171536044796854
2023-11-02 22:26:10   INFO  epoch: 22/30, acc_iter=29846, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:48, time_cost(all): 8:14:05/2:43:37, loss=0.356148289386526, d_time=0.00(0.00), f_time=1.07(1.01), b_time=1.19(1.03), norm=1.4312141162631737, lr=0.000169933103934686
2023-11-02 22:27:00   INFO  epoch: 22/30, acc_iter=29896, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:21, time_cost(all): 8:14:55/2:42:14, loss=0.355725610833844, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.95(1.03), norm=4.419042287259426, lr=0.000168330163072517
2023-11-02 22:27:50   INFO  epoch: 22/30, acc_iter=29946, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:05:59, time_cost(all): 8:15:45/2:49:21, loss=0.355302932281161, d_time=0.00(0.00), f_time=1.05(1.01), b_time=0.92(1.03), norm=3.174028363168955, lr=0.000166727222210349
2023-11-02 22:28:41   INFO  epoch: 22/30, acc_iter=29996, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:34, time_cost(all): 8:16:36/2:46:21, loss=0.354880253728479, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.9(1.03), norm=3.912013239427128, lr=0.00016512428134818
2023-11-02 22:29:31   INFO  epoch: 22/30, acc_iter=30046, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:18, time_cost(all): 8:17:26/2:41:13, loss=0.354457575175797, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.01(1.03), norm=4.94261962309373, lr=0.000163521340486012
2023-11-02 22:30:21   INFO  epoch: 22/30, acc_iter=30096, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:28, time_cost(all): 8:18:16/2:45:11, loss=0.354034896623114, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.2(1.03), norm=1.8107487560888793, lr=0.000161918399623843
2023-11-02 22:31:12   INFO  epoch: 22/30, acc_iter=30146, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:47, time_cost(all): 8:19:07/2:46:48, loss=0.353612218070432, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.96(1.03), norm=4.682426625321727, lr=0.000160315458761675
2023-11-02 22:32:02   INFO  epoch: 22/30, acc_iter=30196, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:53, time_cost(all): 8:19:57/2:50:15, loss=0.35318953951775, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.01(1.03), norm=3.424969707759137, lr=0.000158712517899506
2023-11-02 22:32:52   INFO  epoch: 22/30, acc_iter=30246, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:05, time_cost(all): 8:20:47/2:40:23, loss=0.352766860965068, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.05(1.03), norm=2.329172618278321, lr=0.000157109577037338
2023-11-02 22:33:43   INFO  epoch: 22/30, acc_iter=30296, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:18, time_cost(all): 8:21:38/2:44:01, loss=0.352344182412385, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.03(1.03), norm=4.403598051360104, lr=0.00015550663617517
2023-11-02 22:34:33   INFO  epoch: 23/30, acc_iter=30364, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:21:19, time_cost(all): 8:22:28/2:48:33, loss=0.351769339580737, d_time=0.00(0.00), f_time=1.01(1.01), b_time=0.83(1.03), norm=0.6874884231798253, lr=0.00015332663660262
2023-11-02 22:35:23   INFO  epoch: 23/30, acc_iter=30414, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:20:34, time_cost(all): 8:23:18/2:45:32, loss=0.351346661028055, d_time=0.00(0.00), f_time=0.99(1.01), b_time=0.9(1.03), norm=3.754172820151524, lr=0.000151723695740452
2023-11-02 22:36:14   INFO  epoch: 23/30, acc_iter=30464, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:20:31, time_cost(all): 8:24:09/2:35:11, loss=0.350923982475373, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.21(1.03), norm=4.095778709284301, lr=0.000150120754878283
2023-11-02 22:37:04   INFO  epoch: 23/30, acc_iter=30514, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:19:17, time_cost(all): 8:24:59/2:44:44, loss=0.35050130392269, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.92(1.03), norm=4.079782287668947, lr=0.000148517814016115
2023-11-02 22:37:54   INFO  epoch: 23/30, acc_iter=30564, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:45, time_cost(all): 8:25:49/2:42:53, loss=0.350078625370008, d_time=0.00(0.00), f_time=1.12(1.01), b_time=0.92(1.03), norm=1.6682887272513818, lr=0.000146914873153946
2023-11-02 22:38:45   INFO  epoch: 23/30, acc_iter=30614, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:17:31, time_cost(all): 8:26:40/2:34:06, loss=0.349655946817326, d_time=0.00(0.00), f_time=1.08(1.01), b_time=0.91(1.03), norm=0.752812354549369, lr=0.000145311932291778
2023-11-02 22:39:35   INFO  epoch: 23/30, acc_iter=30664, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:54, time_cost(all): 8:27:30/2:40:27, loss=0.349233268264644, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.14(1.03), norm=1.0159862129349235, lr=0.00014370899142961
2023-11-02 22:40:25   INFO  epoch: 23/30, acc_iter=30714, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:14:48, time_cost(all): 8:28:20/2:36:21, loss=0.348810589711961, d_time=0.00(0.00), f_time=0.94(1.01), b_time=0.92(1.03), norm=2.1756069485892215, lr=0.000142106050567441
2023-11-02 22:41:16   INFO  epoch: 23/30, acc_iter=30764, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:59, time_cost(all): 8:29:11/2:28:23, loss=0.348387911159279, d_time=0.00(0.00), f_time=1.18(1.01), b_time=0.85(1.03), norm=2.1883437274339914, lr=0.000140503109705273
2023-11-02 22:42:06   INFO  epoch: 23/30, acc_iter=30814, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:40, time_cost(all): 8:30:01/2:36:59, loss=0.347965232606597, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.03(1.03), norm=1.2069858381119887, lr=0.000138900168843104
2023-11-02 22:42:56   INFO  epoch: 23/30, acc_iter=30864, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:28, time_cost(all): 8:30:51/2:29:57, loss=0.347542554053914, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.01(1.03), norm=1.502653211584441, lr=0.000137297227980936
2023-11-02 22:43:47   INFO  epoch: 23/30, acc_iter=30914, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:25, time_cost(all): 8:31:42/2:30:29, loss=0.347119875501232, d_time=0.00(0.00), f_time=1.05(1.01), b_time=0.95(1.03), norm=2.5841517291137737, lr=0.000135694287118767
2023-11-02 22:44:37   INFO  epoch: 23/30, acc_iter=30964, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:06, time_cost(all): 8:32:32/2:23:23, loss=0.34669719694855, d_time=0.00(0.00), f_time=1.18(1.01), b_time=1.17(1.03), norm=2.691506184793894, lr=0.000134091346256599
2023-11-02 22:45:27   INFO  epoch: 23/30, acc_iter=31014, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:26, time_cost(all): 8:33:22/2:34:03, loss=0.346274518395867, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.98(1.03), norm=4.155718820370092, lr=0.00013248840539443
2023-11-02 22:46:18   INFO  epoch: 23/30, acc_iter=31064, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:56, time_cost(all): 8:34:13/2:35:19, loss=0.345851839843185, d_time=0.00(0.00), f_time=1.17(1.01), b_time=0.94(1.03), norm=1.5144950363081016, lr=0.000130885464532262
2023-11-02 22:47:08   INFO  epoch: 23/30, acc_iter=31114, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:18, time_cost(all): 8:35:03/2:26:41, loss=0.345429161290503, d_time=0.00(0.00), f_time=0.95(1.01), b_time=1.01(1.03), norm=3.4942079338086263, lr=0.000129282523670093
2023-11-02 22:47:58   INFO  epoch: 23/30, acc_iter=31164, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:39, time_cost(all): 8:35:53/2:23:34, loss=0.34500648273782, d_time=0.00(0.00), f_time=0.96(1.01), b_time=1.2(1.03), norm=3.8477111412112173, lr=0.000127679582807925
2023-11-02 22:48:49   INFO  epoch: 23/30, acc_iter=31214, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:07, time_cost(all): 8:36:44/2:32:11, loss=0.344583804185138, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.0(1.03), norm=4.663628481118419, lr=0.000126076641945757
2023-11-02 22:49:39   INFO  epoch: 23/30, acc_iter=31264, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:16, time_cost(all): 8:37:34/2:31:37, loss=0.344161125632456, d_time=0.00(0.00), f_time=0.95(1.01), b_time=0.84(1.03), norm=0.6129757525419179, lr=0.000124473701083588
2023-11-02 22:50:29   INFO  epoch: 23/30, acc_iter=31314, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:14, time_cost(all): 8:38:24/2:25:36, loss=0.343738447079774, d_time=0.00(0.00), f_time=1.12(1.01), b_time=0.93(1.03), norm=1.809456344555283, lr=0.00012287076022142
2023-11-02 22:51:20   INFO  epoch: 23/30, acc_iter=31364, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:32, time_cost(all): 8:39:15/2:24:13, loss=0.343315768527091, d_time=0.00(0.00), f_time=0.95(1.01), b_time=1.23(1.03), norm=3.5986911914112047, lr=0.000121267819359251
2023-11-02 22:52:10   INFO  epoch: 23/30, acc_iter=31414, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:45, time_cost(all): 8:40:05/2:25:16, loss=0.342893089974409, d_time=0.00(0.00), f_time=1.12(1.01), b_time=0.89(1.03), norm=4.354613439712586, lr=0.000119664878497083
2023-11-02 22:53:00   INFO  epoch: 23/30, acc_iter=31464, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:48, time_cost(all): 8:40:55/2:21:33, loss=0.342470411421727, d_time=0.00(0.00), f_time=0.92(1.01), b_time=0.86(1.03), norm=4.657577689460809, lr=0.000118061937634914
2023-11-02 22:53:51   INFO  epoch: 23/30, acc_iter=31514, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:59, time_cost(all): 8:41:46/2:24:52, loss=0.342047732869044, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.14(1.03), norm=1.9996460475689195, lr=0.000116458996772746
2023-11-02 22:54:41   INFO  epoch: 23/30, acc_iter=31564, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:09, time_cost(all): 8:42:36/2:18:37, loss=0.341625054316362, d_time=0.00(0.00), f_time=0.99(1.01), b_time=0.9(1.03), norm=1.1721768803120427, lr=0.000114856055910577
2023-11-02 22:55:31   INFO  epoch: 23/30, acc_iter=31614, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:18, time_cost(all): 8:43:26/2:22:17, loss=0.34120237576368, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.18(1.03), norm=1.7697210668689005, lr=0.000113253115048409
2023-11-02 22:56:22   INFO  epoch: 24/30, acc_iter=31682, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:22:20, time_cost(all): 8:44:17/2:26:01, loss=0.340627532932032, d_time=0.00(0.00), f_time=1.01(1.01), b_time=1.22(1.03), norm=4.274499547531722, lr=0.00011107311547586
2023-11-02 22:57:12   INFO  epoch: 24/30, acc_iter=31732, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:19:48, time_cost(all): 8:45:07/2:24:56, loss=0.34020485437935, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.05(1.03), norm=0.7078155908227448, lr=0.000109470174613691
2023-11-02 22:58:02   INFO  epoch: 24/30, acc_iter=31782, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:19:48, time_cost(all): 8:45:57/2:23:31, loss=0.339782175826667, d_time=0.00(0.00), f_time=1.01(1.01), b_time=1.04(1.03), norm=3.411398011028111, lr=0.000107867233751523
2023-11-02 22:58:53   INFO  epoch: 24/30, acc_iter=31832, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:19:37, time_cost(all): 8:46:48/2:11:44, loss=0.339359497273985, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.85(1.03), norm=2.323975612757058, lr=0.000106264292889354
2023-11-02 22:59:43   INFO  epoch: 24/30, acc_iter=31882, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:56, time_cost(all): 8:47:38/2:13:35, loss=0.338936818721303, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.12(1.03), norm=4.449326164653975, lr=0.000104661352027186
2023-11-02 23:00:33   INFO  epoch: 24/30, acc_iter=31932, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:16:57, time_cost(all): 8:48:28/2:15:07, loss=0.33851414016862, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.1(1.03), norm=3.0595459558752736, lr=0.000103058411165018
2023-11-02 23:01:24   INFO  epoch: 24/30, acc_iter=31982, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:10, time_cost(all): 8:49:19/2:11:47, loss=0.338091461615938, d_time=0.00(0.00), f_time=1.19(1.01), b_time=0.99(1.03), norm=2.258153410199894, lr=0.000101455470302849
2023-11-02 23:02:14   INFO  epoch: 24/30, acc_iter=32032, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:34, time_cost(all): 8:50:09/2:18:53, loss=0.337668783063256, d_time=0.00(0.00), f_time=1.02(1.01), b_time=0.92(1.03), norm=2.214589988287102, lr=9.9923011693296e-05
2023-11-02 23:03:04   INFO  epoch: 24/30, acc_iter=32082, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:37, time_cost(all): 8:50:59/2:14:35, loss=0.337246104510573, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.12(1.03), norm=4.329381604415399, lr=9.9086182272606e-05
2023-11-02 23:03:55   INFO  epoch: 24/30, acc_iter=32132, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:38, time_cost(all): 8:51:50/2:16:50, loss=0.336823425957891, d_time=0.00(0.00), f_time=1.15(1.01), b_time=1.03(1.03), norm=1.1857005672941239, lr=9.8249352851915e-05
2023-11-02 23:04:45   INFO  epoch: 24/30, acc_iter=32182, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:18, time_cost(all): 8:52:40/2:07:57, loss=0.336400747405209, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.03(1.03), norm=4.7360678857048955, lr=9.7412523431224e-05
2023-11-02 23:05:35   INFO  epoch: 24/30, acc_iter=32232, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:38, time_cost(all): 8:53:30/2:12:34, loss=0.335978068852526, d_time=0.00(0.00), f_time=1.17(1.01), b_time=0.99(1.03), norm=2.731371743555049, lr=9.6575694010533e-05
2023-11-02 23:06:26   INFO  epoch: 24/30, acc_iter=32282, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:43, time_cost(all): 8:54:21/2:13:28, loss=0.335555390299844, d_time=0.00(0.00), f_time=1.18(1.01), b_time=1.18(1.03), norm=1.3490505001965813, lr=9.5738864589842e-05
2023-11-02 23:07:16   INFO  epoch: 24/30, acc_iter=32332, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:08, time_cost(all): 8:55:11/2:11:33, loss=0.335132711747162, d_time=0.00(0.00), f_time=0.91(1.01), b_time=1.15(1.03), norm=4.99971826941126, lr=9.4902035169151e-05
2023-11-02 23:08:06   INFO  epoch: 24/30, acc_iter=32382, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:16, time_cost(all): 8:56:01/2:02:30, loss=0.33471003319448, d_time=0.00(0.00), f_time=1.0(1.01), b_time=1.22(1.03), norm=2.311451279626847, lr=9.406520574846e-05
2023-11-02 23:08:57   INFO  epoch: 24/30, acc_iter=32432, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:09:00, time_cost(all): 8:56:52/2:11:23, loss=0.334287354641797, d_time=0.00(0.00), f_time=0.94(1.01), b_time=1.03(1.03), norm=3.2615257454215714, lr=9.3228376327769e-05
2023-11-02 23:09:47   INFO  epoch: 24/30, acc_iter=32482, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:08:11, time_cost(all): 8:57:42/2:01:51, loss=0.333864676089115, d_time=0.00(0.00), f_time=1.09(1.01), b_time=1.12(1.03), norm=3.7129860389716645, lr=9.2391546907078e-05
2023-11-02 23:10:37   INFO  epoch: 24/30, acc_iter=32532, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:06:52, time_cost(all): 8:58:32/2:01:17, loss=0.333441997536433, d_time=0.00(0.00), f_time=1.18(1.01), b_time=1.04(1.03), norm=1.5220697301311679, lr=9.1554717486388e-05
2023-11-02 23:11:28   INFO  epoch: 24/30, acc_iter=32582, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:00, time_cost(all): 8:59:23/2:03:29, loss=0.33301931898375, d_time=0.00(0.00), f_time=1.01(1.01), b_time=1.22(1.03), norm=4.746763780929577, lr=9.0717888065697e-05
2023-11-02 23:12:18   INFO  epoch: 24/30, acc_iter=32632, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:24, time_cost(all): 9:00:13/2:07:06, loss=0.332596640431068, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.2(1.03), norm=2.8711537163916994, lr=8.9881058645006e-05
2023-11-02 23:13:08   INFO  epoch: 24/30, acc_iter=32682, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:25, time_cost(all): 9:01:03/2:06:30, loss=0.332173961878386, d_time=0.00(0.00), f_time=1.03(1.01), b_time=1.06(1.03), norm=1.2714599380444982, lr=8.9044229224315e-05
2023-11-02 23:13:59   INFO  epoch: 24/30, acc_iter=32732, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:37, time_cost(all): 9:01:54/1:57:10, loss=0.331751283325703, d_time=0.00(0.00), f_time=0.93(1.01), b_time=1.09(1.03), norm=2.474893513804762, lr=8.8207399803624e-05
2023-11-02 23:14:49   INFO  epoch: 24/30, acc_iter=32782, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:46, time_cost(all): 9:02:44/2:06:37, loss=0.331328604773021, d_time=0.00(0.00), f_time=1.0(1.01), b_time=0.84(1.03), norm=4.692658564123773, lr=8.7370570382933e-05
2023-11-02 23:15:39   INFO  epoch: 24/30, acc_iter=32832, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:54, time_cost(all): 9:03:34/1:55:11, loss=0.330905926220339, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.08(1.03), norm=3.320763877745508, lr=8.6533740962242e-05
2023-11-02 23:16:30   INFO  epoch: 24/30, acc_iter=32882, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:09, time_cost(all): 9:04:25/1:59:47, loss=0.330483247667657, d_time=0.00(0.00), f_time=1.0(1.01), b_time=0.99(1.03), norm=1.2286323162823707, lr=8.5696911541551e-05
2023-11-02 23:17:20   INFO  epoch: 24/30, acc_iter=32932, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:18, time_cost(all): 9:05:15/1:53:28, loss=0.330060569114974, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.1(1.03), norm=1.9268077996159774, lr=8.486008212086e-05
2023-11-02 23:18:10   INFO  epoch: 25/30, acc_iter=33000, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:21:04, time_cost(all): 9:06:05/1:59:48, loss=0.329485726283326, d_time=0.00(0.00), f_time=1.17(1.01), b_time=0.88(1.03), norm=0.70613755476325, lr=8.3721994108721e-05
2023-11-02 23:19:01   INFO  epoch: 25/30, acc_iter=33050, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:20:09, time_cost(all): 9:06:56/1:59:55, loss=0.329063047730644, d_time=0.00(0.00), f_time=0.99(1.01), b_time=0.95(1.03), norm=2.33921956434588, lr=8.288516468803e-05
2023-11-02 23:19:51   INFO  epoch: 25/30, acc_iter=33100, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:20:15, time_cost(all): 9:07:46/1:52:12, loss=0.328640369177962, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.89(1.03), norm=0.7863253133071175, lr=8.2048335267339e-05
2023-11-02 23:20:41   INFO  epoch: 25/30, acc_iter=33150, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:17:54, time_cost(all): 9:08:36/1:52:18, loss=0.328217690625279, d_time=0.00(0.00), f_time=0.94(1.01), b_time=1.22(1.03), norm=1.9645265567523875, lr=8.1211505846648e-05
2023-11-02 23:21:32   INFO  epoch: 25/30, acc_iter=33200, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:29, time_cost(all): 9:09:27/1:52:21, loss=0.327795012072597, d_time=0.00(0.00), f_time=1.11(1.01), b_time=1.0(1.03), norm=3.8684028785893325, lr=8.0374676425957e-05
2023-11-02 23:22:22   INFO  epoch: 25/30, acc_iter=33250, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:16:43, time_cost(all): 9:10:17/1:48:31, loss=0.327372333519915, d_time=0.00(0.00), f_time=0.93(1.01), b_time=1.03(1.03), norm=2.5542105041486236, lr=7.9537847005266e-05
2023-11-02 23:23:12   INFO  epoch: 25/30, acc_iter=33300, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:28, time_cost(all): 9:11:07/1:51:41, loss=0.326949654967232, d_time=0.00(0.00), f_time=1.11(1.01), b_time=1.06(1.03), norm=3.278370310522591, lr=7.8701017584576e-05
2023-11-02 23:24:03   INFO  epoch: 25/30, acc_iter=33350, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:16:00, time_cost(all): 9:11:58/1:51:23, loss=0.32652697641455, d_time=0.00(0.00), f_time=1.05(1.01), b_time=0.87(1.03), norm=2.180350091300099, lr=7.7864188163885e-05
2023-11-02 23:24:53   INFO  epoch: 25/30, acc_iter=33400, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:32, time_cost(all): 9:12:48/1:46:34, loss=0.326104297861868, d_time=0.00(0.00), f_time=0.96(1.01), b_time=0.91(1.03), norm=0.9233413964794397, lr=7.7027358743194e-05
2023-11-02 23:25:43   INFO  epoch: 25/30, acc_iter=33450, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:42, time_cost(all): 9:13:38/1:44:35, loss=0.325681619309186, d_time=0.00(0.00), f_time=1.0(1.01), b_time=0.87(1.03), norm=1.7189524542871375, lr=7.6190529322503e-05
2023-11-02 23:26:33   INFO  epoch: 25/30, acc_iter=33500, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:19, time_cost(all): 9:14:28/1:47:29, loss=0.325258940756503, d_time=0.00(0.00), f_time=1.15(1.01), b_time=1.03(1.03), norm=3.6382285873837166, lr=7.5353699901812e-05
2023-11-02 23:27:24   INFO  epoch: 25/30, acc_iter=33550, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:05, time_cost(all): 9:15:19/1:47:42, loss=0.324836262203821, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.05(1.03), norm=4.492910647642531, lr=7.4516870481121e-05
2023-11-02 23:28:14   INFO  epoch: 25/30, acc_iter=33600, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:29, time_cost(all): 9:16:09/1:47:54, loss=0.324413583651139, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.03(1.03), norm=0.7561292994719877, lr=7.368004106043e-05
2023-11-02 23:29:04   INFO  epoch: 25/30, acc_iter=33650, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:02, time_cost(all): 9:16:59/1:44:57, loss=0.323990905098456, d_time=0.00(0.00), f_time=1.05(1.01), b_time=0.91(1.03), norm=1.1297889743586993, lr=7.2843211639739e-05
2023-11-02 23:29:55   INFO  epoch: 25/30, acc_iter=33700, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:24, time_cost(all): 9:17:50/1:49:37, loss=0.323568226545774, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.1(1.03), norm=2.786543408785857, lr=7.2006382219048e-05
2023-11-02 23:30:45   INFO  epoch: 25/30, acc_iter=33750, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:15, time_cost(all): 9:18:40/1:47:50, loss=0.323145547993092, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.2(1.03), norm=3.7017492849551417, lr=7.1169552798358e-05
2023-11-02 23:31:35   INFO  epoch: 25/30, acc_iter=33800, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:43, time_cost(all): 9:19:30/1:45:07, loss=0.322722869440409, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.14(1.03), norm=3.725975919578279, lr=7.0332723377667e-05
2023-11-02 23:32:26   INFO  epoch: 25/30, acc_iter=33850, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:03, time_cost(all): 9:20:21/1:39:23, loss=0.322300190887727, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.07(1.03), norm=2.636574920314504, lr=6.9495893956976e-05
2023-11-02 23:33:16   INFO  epoch: 25/30, acc_iter=33900, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:14, time_cost(all): 9:21:11/1:45:58, loss=0.321877512335045, d_time=0.00(0.00), f_time=0.96(1.01), b_time=0.86(1.03), norm=3.910018703431797, lr=6.8659064536285e-05
2023-11-02 23:34:06   INFO  epoch: 25/30, acc_iter=33950, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:19, time_cost(all): 9:22:01/1:40:58, loss=0.321454833782363, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.17(1.03), norm=4.545040827578212, lr=6.7822235115594e-05
2023-11-02 23:34:57   INFO  epoch: 25/30, acc_iter=34000, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:22, time_cost(all): 9:22:52/1:45:12, loss=0.32103215522968, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.06(1.03), norm=2.879199743356596, lr=6.6985405694903e-05
2023-11-02 23:35:47   INFO  epoch: 25/30, acc_iter=34050, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:48, time_cost(all): 9:23:42/1:42:40, loss=0.320609476676998, d_time=0.00(0.00), f_time=0.93(1.01), b_time=1.0(1.03), norm=3.6807930492209953, lr=6.6148576274212e-05
2023-11-02 23:36:37   INFO  epoch: 25/30, acc_iter=34100, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:56, time_cost(all): 9:24:32/1:39:35, loss=0.320186798124316, d_time=0.00(0.00), f_time=0.93(1.01), b_time=0.94(1.03), norm=1.2871415073468746, lr=6.5311746853521e-05
2023-11-02 23:37:28   INFO  epoch: 25/30, acc_iter=34150, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:56, time_cost(all): 9:25:23/1:34:42, loss=0.319764119571633, d_time=0.00(0.00), f_time=1.03(1.01), b_time=1.22(1.03), norm=1.0191146302030933, lr=6.447491743283e-05
2023-11-02 23:38:18   INFO  epoch: 25/30, acc_iter=34200, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:07, time_cost(all): 9:26:13/1:36:03, loss=0.319341441018951, d_time=0.00(0.00), f_time=1.1(1.01), b_time=0.96(1.03), norm=2.459869353383957, lr=6.363808801214e-05
2023-11-02 23:39:08   INFO  epoch: 25/30, acc_iter=34250, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:18, time_cost(all): 9:27:03/1:39:43, loss=0.318918762466269, d_time=0.00(0.00), f_time=1.18(1.01), b_time=1.04(1.03), norm=1.6510122536641403, lr=6.2801258591449e-05
2023-11-02 23:39:59   INFO  epoch: 26/30, acc_iter=34318, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:20:57, time_cost(all): 9:27:54/1:31:13, loss=0.318343919634621, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.03(1.03), norm=3.2141178763651848, lr=6.1663170579309e-05
2023-11-02 23:40:49   INFO  epoch: 26/30, acc_iter=34368, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:20:43, time_cost(all): 9:28:44/1:33:44, loss=0.317921241081939, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.87(1.03), norm=1.6695923085351254, lr=6.0826341158618e-05
2023-11-02 23:41:39   INFO  epoch: 26/30, acc_iter=34418, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:20:01, time_cost(all): 9:29:34/1:31:26, loss=0.317498562529256, d_time=0.00(0.00), f_time=1.12(1.01), b_time=0.84(1.03), norm=3.142678793094907, lr=5.9989511737927e-05
2023-11-02 23:42:30   INFO  epoch: 26/30, acc_iter=34468, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:18:32, time_cost(all): 9:30:25/1:31:52, loss=0.317075883976574, d_time=0.00(0.00), f_time=1.07(1.01), b_time=0.97(1.03), norm=1.1100165151852803, lr=5.9152682317236e-05
2023-11-02 23:43:20   INFO  epoch: 26/30, acc_iter=34518, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:18:46, time_cost(all): 9:31:15/1:31:37, loss=0.316653205423892, d_time=0.00(0.00), f_time=0.95(1.01), b_time=1.05(1.03), norm=3.3222946575200347, lr=5.8315852896546e-05
2023-11-02 23:44:10   INFO  epoch: 26/30, acc_iter=34568, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:16:31, time_cost(all): 9:32:05/1:30:12, loss=0.316230526871209, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.16(1.03), norm=3.916822463127, lr=5.7479023475855e-05
2023-11-02 23:45:01   INFO  epoch: 26/30, acc_iter=34618, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:11, time_cost(all): 9:32:56/1:26:39, loss=0.315807848318527, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.07(1.03), norm=4.309579163005331, lr=5.6642194055164e-05
2023-11-02 23:45:51   INFO  epoch: 26/30, acc_iter=34668, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:17, time_cost(all): 9:33:46/1:25:13, loss=0.315385169765845, d_time=0.00(0.00), f_time=1.11(1.01), b_time=1.2(1.03), norm=3.412292969303516, lr=5.5805364634473e-05
2023-11-02 23:46:41   INFO  epoch: 26/30, acc_iter=34718, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:02, time_cost(all): 9:34:36/1:26:13, loss=0.314962491213162, d_time=0.00(0.00), f_time=0.98(1.01), b_time=1.08(1.03), norm=1.7084341257800841, lr=5.4968535213782e-05
2023-11-02 23:47:32   INFO  epoch: 26/30, acc_iter=34768, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:36, time_cost(all): 9:35:27/1:31:21, loss=0.31453981266048, d_time=0.00(0.00), f_time=1.11(1.01), b_time=1.04(1.03), norm=4.695514384045852, lr=5.4131705793091e-05
2023-11-02 23:48:22   INFO  epoch: 26/30, acc_iter=34818, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:59, time_cost(all): 9:36:17/1:23:27, loss=0.314117134107798, d_time=0.00(0.00), f_time=1.0(1.01), b_time=0.96(1.03), norm=2.9382700494987404, lr=5.32948763724e-05
2023-11-02 23:49:12   INFO  epoch: 26/30, acc_iter=34868, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:11:30, time_cost(all): 9:37:07/1:25:43, loss=0.313694455555115, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.11(1.03), norm=4.190035764679381, lr=5.2458046951709e-05
2023-11-02 23:50:03   INFO  epoch: 26/30, acc_iter=34918, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:42, time_cost(all): 9:37:58/1:28:50, loss=0.313271777002433, d_time=0.00(0.00), f_time=1.0(1.01), b_time=1.12(1.03), norm=3.717237581580545, lr=5.1621217531018e-05
2023-11-02 23:50:53   INFO  epoch: 26/30, acc_iter=34968, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:20, time_cost(all): 9:38:48/1:27:49, loss=0.312849098449751, d_time=0.00(0.00), f_time=1.01(1.01), b_time=1.01(1.03), norm=1.5794797566206533, lr=5.0784388110328e-05
2023-11-02 23:51:43   INFO  epoch: 26/30, acc_iter=35018, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:25, time_cost(all): 9:39:38/1:24:55, loss=0.312426419897069, d_time=0.00(0.00), f_time=1.13(1.01), b_time=0.94(1.03), norm=2.296914690479488, lr=4.9947558689637e-05
2023-11-02 23:52:34   INFO  epoch: 26/30, acc_iter=35068, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:09:06, time_cost(all): 9:40:29/1:20:40, loss=0.312003741344386, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.02(1.03), norm=0.5471353340469916, lr=4.9110729268946e-05
2023-11-02 23:53:24   INFO  epoch: 26/30, acc_iter=35118, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:08:01, time_cost(all): 9:41:19/1:18:27, loss=0.311581062791704, d_time=0.00(0.00), f_time=0.92(1.01), b_time=1.1(1.03), norm=2.062360609698176, lr=4.8273899848255e-05
2023-11-02 23:54:14   INFO  epoch: 26/30, acc_iter=35168, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:06:56, time_cost(all): 9:42:09/1:22:43, loss=0.311158384239022, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.04(1.03), norm=3.447106773715943, lr=4.7437070427564e-05
2023-11-02 23:55:05   INFO  epoch: 26/30, acc_iter=35218, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:06, time_cost(all): 9:43:00/1:23:18, loss=0.310735705686339, d_time=0.00(0.00), f_time=1.21(1.01), b_time=0.87(1.03), norm=0.9606217304948415, lr=4.6600241006873e-05
2023-11-02 23:55:55   INFO  epoch: 26/30, acc_iter=35268, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:13, time_cost(all): 9:43:50/1:18:23, loss=0.310313027133657, d_time=0.00(0.00), f_time=1.14(1.01), b_time=0.99(1.03), norm=4.462808419260611, lr=4.5763411586182e-05
2023-11-02 23:56:45   INFO  epoch: 26/30, acc_iter=35318, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:40, time_cost(all): 9:44:40/1:16:48, loss=0.309890348580975, d_time=0.00(0.00), f_time=0.96(1.01), b_time=1.09(1.03), norm=2.2353989633886355, lr=4.4926582165491e-05
2023-11-02 23:57:36   INFO  epoch: 26/30, acc_iter=35368, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:34, time_cost(all): 9:45:31/1:19:29, loss=0.309467670028293, d_time=0.00(0.00), f_time=1.06(1.01), b_time=0.89(1.03), norm=4.281246235057995, lr=4.40897527448e-05
2023-11-02 23:58:26   INFO  epoch: 26/30, acc_iter=35418, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:53, time_cost(all): 9:46:21/1:18:24, loss=0.30904499147561, d_time=0.00(0.00), f_time=1.09(1.01), b_time=0.9(1.03), norm=4.029104368376398, lr=4.325292332411e-05
2023-11-02 23:59:16   INFO  epoch: 26/30, acc_iter=35468, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:02:02, time_cost(all): 9:47:11/1:18:28, loss=0.308622312922928, d_time=0.00(0.00), f_time=1.15(1.01), b_time=0.84(1.03), norm=2.4091403454060343, lr=4.2416093903419e-05
2023-11-03 00:00:07   INFO  epoch: 26/30, acc_iter=35518, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:10, time_cost(all): 9:48:02/1:13:28, loss=0.308199634370246, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.09(1.03), norm=1.06382962265557, lr=4.1579264482728e-05
2023-11-03 00:00:57   INFO  epoch: 26/30, acc_iter=35568, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:18, time_cost(all): 9:48:52/1:14:55, loss=0.307776955817563, d_time=0.00(0.00), f_time=1.21(1.01), b_time=1.12(1.03), norm=4.0347378454594605, lr=4.0742435062037e-05
2023-11-03 00:01:47   INFO  epoch: 27/30, acc_iter=35636, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:22:08, time_cost(all): 9:49:42/1:10:27, loss=0.307202112985915, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.18(1.03), norm=4.830477705131511, lr=3.9604347049897e-05
2023-11-03 00:02:38   INFO  epoch: 27/30, acc_iter=35686, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:19:30, time_cost(all): 9:50:33/1:13:01, loss=0.306779434433233, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.08(1.03), norm=3.191940651682773, lr=3.8767517629206e-05
2023-11-03 00:03:28   INFO  epoch: 27/30, acc_iter=35736, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:19:30, time_cost(all): 9:51:23/1:11:33, loss=0.306356755880551, d_time=0.00(0.00), f_time=0.99(1.01), b_time=0.92(1.03), norm=1.377786096796988, lr=3.7930688208516e-05
2023-11-03 00:04:18   INFO  epoch: 27/30, acc_iter=35786, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:18:21, time_cost(all): 9:52:13/1:10:53, loss=0.305934077327868, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.1(1.03), norm=3.1648876537450237, lr=3.7093858787825e-05
2023-11-03 00:05:09   INFO  epoch: 27/30, acc_iter=35836, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:17:32, time_cost(all): 9:53:04/1:10:04, loss=0.305511398775186, d_time=0.00(0.00), f_time=1.07(1.01), b_time=1.17(1.03), norm=1.4574235734974321, lr=3.6257029367134e-05
2023-11-03 00:05:59   INFO  epoch: 27/30, acc_iter=35886, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:17:30, time_cost(all): 9:53:54/1:06:31, loss=0.305088720222504, d_time=0.00(0.00), f_time=1.0(1.01), b_time=1.02(1.03), norm=3.796066706504713, lr=3.5420199946443e-05
2023-11-03 00:06:49   INFO  epoch: 27/30, acc_iter=35936, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:15, time_cost(all): 9:54:44/1:09:05, loss=0.304666041669822, d_time=0.00(0.00), f_time=0.98(1.01), b_time=1.0(1.03), norm=3.0667304403639024, lr=3.4583370525752e-05
2023-11-03 00:07:40   INFO  epoch: 27/30, acc_iter=35986, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:15:32, time_cost(all): 9:55:35/1:07:36, loss=0.304243363117139, d_time=0.00(0.00), f_time=1.1(1.01), b_time=0.89(1.03), norm=3.9493147182881283, lr=3.3746541105061e-05
2023-11-03 00:08:30   INFO  epoch: 27/30, acc_iter=36036, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:21, time_cost(all): 9:56:25/1:03:50, loss=0.303820684564457, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.22(1.03), norm=0.7010174907062148, lr=3.290971168437e-05
2023-11-03 00:09:20   INFO  epoch: 27/30, acc_iter=36086, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:06, time_cost(all): 9:57:15/1:03:13, loss=0.303398006011775, d_time=0.00(0.00), f_time=1.14(1.01), b_time=0.97(1.03), norm=3.016576164118195, lr=3.2072882263679e-05
2023-11-03 00:10:11   INFO  epoch: 27/30, acc_iter=36136, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:13:16, time_cost(all): 9:58:06/1:04:21, loss=0.302975327459092, d_time=0.00(0.00), f_time=1.07(1.01), b_time=1.0(1.03), norm=4.697042923672562, lr=3.1236052842988e-05
2023-11-03 00:11:01   INFO  epoch: 27/30, acc_iter=36186, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:21, time_cost(all): 9:58:56/1:03:34, loss=0.30255264890641, d_time=0.00(0.00), f_time=1.02(1.01), b_time=0.83(1.03), norm=3.6553338479382105, lr=3.0399223422298e-05
2023-11-03 00:11:51   INFO  epoch: 27/30, acc_iter=36236, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:10:46, time_cost(all): 9:59:46/1:05:56, loss=0.302129970353728, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.16(1.03), norm=3.128737465590299, lr=2.9562394001607e-05
2023-11-03 00:12:42   INFO  epoch: 27/30, acc_iter=36286, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:03, time_cost(all): 10:00:37/1:04:56, loss=0.301707291801045, d_time=0.00(0.00), f_time=1.03(1.01), b_time=1.02(1.03), norm=2.117844201348901, lr=2.8725564580916e-05
2023-11-03 00:13:32   INFO  epoch: 27/30, acc_iter=36336, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:13, time_cost(all): 10:01:27/1:00:37, loss=0.301284613248363, d_time=0.00(0.00), f_time=0.96(1.01), b_time=1.18(1.03), norm=4.273943561242315, lr=2.7888735160225e-05
2023-11-03 00:14:22   INFO  epoch: 27/30, acc_iter=36386, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:17, time_cost(all): 10:02:17/1:02:50, loss=0.300861934695681, d_time=0.00(0.00), f_time=1.14(1.01), b_time=1.0(1.03), norm=0.88874832905801, lr=2.7051905739534e-05
2023-11-03 00:15:13   INFO  epoch: 27/30, acc_iter=36436, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:28, time_cost(all): 10:03:08/1:00:56, loss=0.300439256142998, d_time=0.00(0.00), f_time=1.0(1.01), b_time=0.88(1.03), norm=3.3251825165607944, lr=2.6215076318843e-05
2023-11-03 00:16:03   INFO  epoch: 27/30, acc_iter=36486, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:16, time_cost(all): 10:03:58/0:59:53, loss=0.300016577590316, d_time=0.00(0.00), f_time=1.03(1.01), b_time=1.05(1.03), norm=4.647601243386716, lr=2.5378246898152e-05
2023-11-03 00:16:53   INFO  epoch: 27/30, acc_iter=36536, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:05:55, time_cost(all): 10:04:48/0:58:06, loss=0.299593899037634, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.04(1.03), norm=3.0050520367945013, lr=2.4541417477461e-05
2023-11-03 00:17:44   INFO  epoch: 27/30, acc_iter=36586, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:08, time_cost(all): 10:05:39/0:56:24, loss=0.299171220484952, d_time=0.00(0.00), f_time=0.97(1.01), b_time=0.92(1.03), norm=1.1647044437574416, lr=2.370458805677e-05
2023-11-03 00:18:34   INFO  epoch: 27/30, acc_iter=36636, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:37, time_cost(all): 10:06:29/0:59:17, loss=0.298748541932269, d_time=0.00(0.00), f_time=1.02(1.01), b_time=1.12(1.03), norm=1.5191364918939474, lr=2.286775863608e-05
2023-11-03 00:19:24   INFO  epoch: 27/30, acc_iter=36686, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:35, time_cost(all): 10:07:19/0:54:45, loss=0.298325863379587, d_time=0.00(0.00), f_time=1.12(1.01), b_time=1.15(1.03), norm=1.6664826726025952, lr=2.2030929215389e-05
2023-11-03 00:20:15   INFO  epoch: 27/30, acc_iter=36736, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:46, time_cost(all): 10:08:10/0:53:25, loss=0.297903184826905, d_time=0.00(0.00), f_time=0.92(1.01), b_time=1.13(1.03), norm=3.2555866391019057, lr=2.1194099794698e-05
2023-11-03 00:21:05   INFO  epoch: 27/30, acc_iter=36786, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:02:01, time_cost(all): 10:09:00/0:54:57, loss=0.297480506274222, d_time=0.00(0.00), f_time=1.04(1.01), b_time=1.13(1.03), norm=2.1415527353142454, lr=2.0357270374007e-05
2023-11-03 00:21:55   INFO  epoch: 27/30, acc_iter=36836, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:06, time_cost(all): 10:09:50/0:52:21, loss=0.29705782772154, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.05(1.03), norm=0.6821055631390573, lr=1.9520440953316e-05
2023-11-03 00:22:46   INFO  epoch: 27/30, acc_iter=36886, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:18, time_cost(all): 10:10:41/0:52:44, loss=0.296635149168858, d_time=0.00(0.00), f_time=1.15(1.01), b_time=0.92(1.03), norm=0.5716288688518165, lr=1.8683611532625e-05
2023-11-03 00:23:36   INFO  epoch: 28/30, acc_iter=36954, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:21:16, time_cost(all): 10:11:31/0:50:25, loss=0.29606030633721, d_time=0.00(0.00), f_time=1.03(1.01), b_time=1.12(1.03), norm=4.189350509522765, lr=1.7545523520486e-05
2023-11-03 00:24:26   INFO  epoch: 28/30, acc_iter=37004, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:19:56, time_cost(all): 10:12:21/0:48:59, loss=0.295637627784528, d_time=0.00(0.00), f_time=0.91(1.01), b_time=1.13(1.03), norm=4.705659449432259, lr=1.6708694099795e-05
2023-11-03 00:25:17   INFO  epoch: 28/30, acc_iter=37054, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:19:15, time_cost(all): 10:13:12/0:52:16, loss=0.295214949231845, d_time=0.00(0.00), f_time=1.05(1.01), b_time=0.93(1.03), norm=3.6318995889165584, lr=1.5871864679104e-05
2023-11-03 00:26:07   INFO  epoch: 28/30, acc_iter=37104, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:18:43, time_cost(all): 10:14:02/0:49:51, loss=0.294792270679163, d_time=0.00(0.00), f_time=0.94(1.01), b_time=0.9(1.03), norm=1.8347342328206095, lr=1.5035035258413e-05
2023-11-03 00:26:57   INFO  epoch: 28/30, acc_iter=37154, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:18:08, time_cost(all): 10:14:52/0:47:16, loss=0.294369592126481, d_time=0.00(0.00), f_time=1.11(1.01), b_time=1.01(1.03), norm=4.993590998259228, lr=1.4198205837722e-05
2023-11-03 00:27:48   INFO  epoch: 28/30, acc_iter=37204, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:17:50, time_cost(all): 10:15:43/0:49:31, loss=0.293946913573798, d_time=0.00(0.00), f_time=1.07(1.01), b_time=0.83(1.03), norm=3.8022579132964447, lr=1.3361376417031e-05
2023-11-03 00:28:38   INFO  epoch: 28/30, acc_iter=37254, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:15:38, time_cost(all): 10:16:33/0:47:12, loss=0.293524235021116, d_time=0.00(0.00), f_time=1.09(1.01), b_time=1.08(1.03), norm=2.7035906536444596, lr=1.252454699634e-05
2023-11-03 00:29:28   INFO  epoch: 28/30, acc_iter=37304, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:14:52, time_cost(all): 10:17:23/0:44:34, loss=0.293101556468434, d_time=0.00(0.00), f_time=0.96(1.01), b_time=1.06(1.03), norm=1.6695740237865306, lr=1.1687717575649e-05
2023-11-03 00:30:19   INFO  epoch: 28/30, acc_iter=37354, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:27, time_cost(all): 10:18:14/0:45:56, loss=0.292678877915751, d_time=0.00(0.00), f_time=1.16(1.01), b_time=1.1(1.03), norm=4.288477890153921, lr=1.0850888154958e-05
2023-11-03 00:31:09   INFO  epoch: 28/30, acc_iter=37404, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:54, time_cost(all): 10:19:04/0:42:22, loss=0.292256199363069, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.15(1.03), norm=4.431607045454346, lr=1.0014058734268e-05
2023-11-03 00:31:59   INFO  epoch: 28/30, acc_iter=37454, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:22, time_cost(all): 10:19:54/0:41:47, loss=0.291833520810387, d_time=0.00(0.00), f_time=0.99(1.01), b_time=0.92(1.03), norm=1.9842516276951125, lr=9.769782667341e-06
2023-11-03 00:32:50   INFO  epoch: 28/30, acc_iter=37504, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:06, time_cost(all): 10:20:45/0:41:26, loss=0.291410842257704, d_time=0.00(0.00), f_time=1.16(1.01), b_time=1.22(1.03), norm=3.4975593817541153, lr=9.535631596695e-06
2023-11-03 00:33:40   INFO  epoch: 28/30, acc_iter=37554, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:07, time_cost(all): 10:21:35/0:42:34, loss=0.290988163705022, d_time=0.00(0.00), f_time=1.21(1.01), b_time=0.92(1.03), norm=0.8553274878953444, lr=9.30148052605e-06
2023-11-03 00:34:30   INFO  epoch: 28/30, acc_iter=37604, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:25, time_cost(all): 10:22:25/0:42:42, loss=0.29056548515234, d_time=0.00(0.00), f_time=1.11(1.01), b_time=1.03(1.03), norm=1.1898546161664616, lr=9.067329455404e-06
2023-11-03 00:35:21   INFO  epoch: 28/30, acc_iter=37654, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:40, time_cost(all): 10:23:16/0:41:04, loss=0.290142806599658, d_time=0.00(0.00), f_time=1.16(1.01), b_time=1.1(1.03), norm=2.7662982813415153, lr=8.833178384758e-06
2023-11-03 00:36:11   INFO  epoch: 28/30, acc_iter=37704, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:45, time_cost(all): 10:24:06/0:40:24, loss=0.289720128046975, d_time=0.00(0.00), f_time=1.12(1.01), b_time=1.1(1.03), norm=1.6705383125514977, lr=8.599027314112e-06
2023-11-03 00:37:01   INFO  epoch: 28/30, acc_iter=37754, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:07:29, time_cost(all): 10:24:56/0:40:01, loss=0.289297449494293, d_time=0.00(0.00), f_time=1.07(1.01), b_time=1.19(1.03), norm=2.3988635229878277, lr=8.364876243467e-06
2023-11-03 00:37:52   INFO  epoch: 28/30, acc_iter=37804, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:07:16, time_cost(all): 10:25:47/0:37:15, loss=0.288874770941611, d_time=0.00(0.00), f_time=1.2(1.01), b_time=0.99(1.03), norm=2.6267228457937426, lr=8.130725172821e-06
2023-11-03 00:38:42   INFO  epoch: 28/30, acc_iter=37854, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:05, time_cost(all): 10:26:37/0:36:00, loss=0.288452092388928, d_time=0.00(0.00), f_time=0.97(1.01), b_time=1.21(1.03), norm=4.227881107205635, lr=7.896574102175e-06
2023-11-03 00:39:32   INFO  epoch: 28/30, acc_iter=37904, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:35, time_cost(all): 10:27:27/0:34:40, loss=0.288029413836246, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.17(1.03), norm=4.185129686836104, lr=7.662423031529e-06
2023-11-03 00:40:23   INFO  epoch: 28/30, acc_iter=37954, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:37, time_cost(all): 10:28:18/0:35:19, loss=0.287606735283564, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.0(1.03), norm=2.0008518071686154, lr=7.428271960883e-06
2023-11-03 00:41:13   INFO  epoch: 28/30, acc_iter=38004, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:45, time_cost(all): 10:29:08/0:34:42, loss=0.287184056730881, d_time=0.00(0.00), f_time=0.98(1.01), b_time=1.03(1.03), norm=3.360455348393531, lr=7.194120890238e-06
2023-11-03 00:42:03   INFO  epoch: 28/30, acc_iter=38054, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:44, time_cost(all): 10:29:58/0:33:05, loss=0.286761378178199, d_time=0.00(0.00), f_time=1.08(1.01), b_time=1.01(1.03), norm=2.6696130084107015, lr=6.959969819592e-06
2023-11-03 00:42:54   INFO  epoch: 28/30, acc_iter=38104, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:01:53, time_cost(all): 10:30:49/0:32:58, loss=0.286338699625517, d_time=0.00(0.00), f_time=1.17(1.01), b_time=0.92(1.03), norm=4.411604148676204, lr=6.725818748946e-06
2023-11-03 00:43:44   INFO  epoch: 28/30, acc_iter=38154, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:09, time_cost(all): 10:31:39/0:31:15, loss=0.285916021072835, d_time=0.00(0.00), f_time=1.13(1.01), b_time=1.1(1.03), norm=2.2524690964476934, lr=6.4916676783e-06
2023-11-03 00:44:34   INFO  epoch: 28/30, acc_iter=38204, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:17, time_cost(all): 10:32:29/0:30:09, loss=0.285493342520152, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.09(1.03), norm=2.9561001384478405, lr=6.257516607655e-06
2023-11-03 00:45:25   INFO  epoch: 29/30, acc_iter=38272, cur_iter=50/1318, batch_size=24, time_cost(epoch): 0:00:50/0:21:02, time_cost(all): 10:33:20/0:29:52, loss=0.284918499688504, d_time=0.00(0.00), f_time=1.14(1.01), b_time=0.84(1.03), norm=2.242876156006072, lr=5.939071151576e-06
2023-11-03 00:46:15   INFO  epoch: 29/30, acc_iter=38322, cur_iter=100/1318, batch_size=24, time_cost(epoch): 0:01:40/0:21:14, time_cost(all): 10:34:10/0:28:23, loss=0.284495821135822, d_time=0.00(0.00), f_time=1.2(1.01), b_time=0.94(1.03), norm=4.489462195187323, lr=5.704920080931e-06
2023-11-03 00:47:05   INFO  epoch: 29/30, acc_iter=38372, cur_iter=150/1318, batch_size=24, time_cost(epoch): 0:02:30/0:18:43, time_cost(all): 10:35:00/0:28:51, loss=0.28407314258314, d_time=0.00(0.00), f_time=1.0(1.01), b_time=1.03(1.03), norm=3.059856616494973, lr=5.470769010285e-06
2023-11-03 00:47:56   INFO  epoch: 29/30, acc_iter=38422, cur_iter=200/1318, batch_size=24, time_cost(epoch): 0:03:21/0:17:56, time_cost(all): 10:35:51/0:26:39, loss=0.283650464030457, d_time=0.00(0.00), f_time=0.93(1.01), b_time=0.87(1.03), norm=4.255922016421242, lr=5.236617939639e-06
2023-11-03 00:48:46   INFO  epoch: 29/30, acc_iter=38472, cur_iter=250/1318, batch_size=24, time_cost(epoch): 0:04:11/0:18:41, time_cost(all): 10:36:41/0:26:52, loss=0.283227785477775, d_time=0.00(0.00), f_time=1.1(1.01), b_time=1.21(1.03), norm=2.7379498891999043, lr=5.002466868993e-06
2023-11-03 00:49:36   INFO  epoch: 29/30, acc_iter=38522, cur_iter=300/1318, batch_size=24, time_cost(epoch): 0:05:01/0:17:25, time_cost(all): 10:37:31/0:25:48, loss=0.282805106925093, d_time=0.00(0.00), f_time=1.2(1.01), b_time=0.85(1.03), norm=3.394659619752056, lr=4.768315798348e-06
2023-11-03 00:50:27   INFO  epoch: 29/30, acc_iter=38572, cur_iter=350/1318, batch_size=24, time_cost(epoch): 0:05:52/0:16:43, time_cost(all): 10:38:22/0:24:36, loss=0.282382428372411, d_time=0.00(0.00), f_time=1.04(1.01), b_time=0.91(1.03), norm=2.1024008898465594, lr=4.534164727702e-06
2023-11-03 00:51:17   INFO  epoch: 29/30, acc_iter=38622, cur_iter=400/1318, batch_size=24, time_cost(epoch): 0:06:42/0:14:58, time_cost(all): 10:39:12/0:24:02, loss=0.281959749819728, d_time=0.00(0.00), f_time=1.03(1.01), b_time=0.91(1.03), norm=3.4089721763546983, lr=4.300013657056e-06
2023-11-03 00:52:07   INFO  epoch: 29/30, acc_iter=38672, cur_iter=450/1318, batch_size=24, time_cost(epoch): 0:07:32/0:14:13, time_cost(all): 10:40:02/0:24:21, loss=0.281537071267046, d_time=0.00(0.00), f_time=1.16(1.01), b_time=0.88(1.03), norm=2.5618241121842127, lr=4.06586258641e-06
2023-11-03 00:52:58   INFO  epoch: 29/30, acc_iter=38722, cur_iter=500/1318, batch_size=24, time_cost(epoch): 0:08:23/0:13:32, time_cost(all): 10:40:53/0:22:01, loss=0.281114392714364, d_time=0.00(0.00), f_time=1.07(1.01), b_time=0.88(1.03), norm=2.2164837844435725, lr=3.831711515765e-06
2023-11-03 00:53:48   INFO  epoch: 29/30, acc_iter=38772, cur_iter=550/1318, batch_size=24, time_cost(epoch): 0:09:13/0:12:24, time_cost(all): 10:41:43/0:22:04, loss=0.280691714161681, d_time=0.00(0.00), f_time=0.91(1.01), b_time=0.87(1.03), norm=3.1108942705823095, lr=3.597560445119e-06
2023-11-03 00:54:38   INFO  epoch: 29/30, acc_iter=38822, cur_iter=600/1318, batch_size=24, time_cost(epoch): 0:10:03/0:12:02, time_cost(all): 10:42:33/0:21:37, loss=0.280269035608999, d_time=0.00(0.00), f_time=1.01(1.01), b_time=1.17(1.03), norm=2.217866486925996, lr=3.363409374473e-06
2023-11-03 00:55:29   INFO  epoch: 29/30, acc_iter=38872, cur_iter=650/1318, batch_size=24, time_cost(epoch): 0:10:54/0:11:29, time_cost(all): 10:43:24/0:19:21, loss=0.279846357056317, d_time=0.00(0.00), f_time=1.05(1.01), b_time=1.06(1.03), norm=2.9982872546212724, lr=3.129258303827e-06
2023-11-03 00:56:19   INFO  epoch: 29/30, acc_iter=38922, cur_iter=700/1318, batch_size=24, time_cost(epoch): 0:11:44/0:10:06, time_cost(all): 10:44:14/0:19:56, loss=0.279423678503634, d_time=0.00(0.00), f_time=0.92(1.01), b_time=0.85(1.03), norm=2.443935205835497, lr=2.895107233182e-06
2023-11-03 00:57:09   INFO  epoch: 29/30, acc_iter=38972, cur_iter=750/1318, batch_size=24, time_cost(epoch): 0:12:34/0:09:25, time_cost(all): 10:45:04/0:18:44, loss=0.279000999950952, d_time=0.00(0.00), f_time=0.99(1.01), b_time=1.01(1.03), norm=2.0819456330260433, lr=2.660956162536e-06
2023-11-03 00:58:00   INFO  epoch: 29/30, acc_iter=39022, cur_iter=800/1318, batch_size=24, time_cost(epoch): 0:13:25/0:08:33, time_cost(all): 10:45:55/0:18:05, loss=0.27857832139827, d_time=0.00(0.00), f_time=1.06(1.01), b_time=1.1(1.03), norm=2.300861957407129, lr=2.42680509189e-06
2023-11-03 00:58:50   INFO  epoch: 29/30, acc_iter=39072, cur_iter=850/1318, batch_size=24, time_cost(epoch): 0:14:15/0:08:09, time_cost(all): 10:46:45/0:16:36, loss=0.278155642845588, d_time=0.00(0.00), f_time=1.17(1.01), b_time=1.0(1.03), norm=2.2091023613708773, lr=2.192654021244e-06
2023-11-03 00:59:40   INFO  epoch: 29/30, acc_iter=39122, cur_iter=900/1318, batch_size=24, time_cost(epoch): 0:15:05/0:06:58, time_cost(all): 10:47:35/0:15:05, loss=0.277732964292905, d_time=0.00(0.00), f_time=0.92(1.01), b_time=1.02(1.03), norm=3.951767219622056, lr=1.958502950599e-06
2023-11-03 01:00:31   INFO  epoch: 29/30, acc_iter=39172, cur_iter=950/1318, batch_size=24, time_cost(epoch): 0:15:56/0:06:18, time_cost(all): 10:48:26/0:14:43, loss=0.277310285740223, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.04(1.03), norm=4.473699351825884, lr=1.724351879953e-06
2023-11-03 01:01:21   INFO  epoch: 29/30, acc_iter=39222, cur_iter=1000/1318, batch_size=24, time_cost(epoch): 0:16:46/0:05:31, time_cost(all): 10:49:16/0:14:30, loss=0.276887607187541, d_time=0.00(0.00), f_time=0.95(1.01), b_time=1.23(1.03), norm=1.375749435591609, lr=1.490200809307e-06
2023-11-03 01:02:11   INFO  epoch: 29/30, acc_iter=39272, cur_iter=1050/1318, batch_size=24, time_cost(epoch): 0:17:36/0:04:39, time_cost(all): 10:50:06/0:13:21, loss=0.276464928634858, d_time=0.00(0.00), f_time=0.93(1.01), b_time=0.96(1.03), norm=4.981940109192315, lr=1.256049738661e-06
2023-11-03 01:03:02   INFO  epoch: 29/30, acc_iter=39322, cur_iter=1100/1318, batch_size=24, time_cost(epoch): 0:18:27/0:03:34, time_cost(all): 10:50:57/0:11:53, loss=0.276042250082176, d_time=0.00(0.00), f_time=0.96(1.01), b_time=0.94(1.03), norm=3.8955337680079247, lr=1.021898668016e-06
2023-11-03 01:03:52   INFO  epoch: 29/30, acc_iter=39372, cur_iter=1150/1318, batch_size=24, time_cost(epoch): 0:19:17/0:02:50, time_cost(all): 10:51:47/0:11:56, loss=0.275619571529494, d_time=0.00(0.00), f_time=1.11(1.01), b_time=0.85(1.03), norm=4.699810021569387, lr=7.8774759737e-07
2023-11-03 01:04:42   INFO  epoch: 29/30, acc_iter=39422, cur_iter=1200/1318, batch_size=24, time_cost(epoch): 0:20:07/0:02:02, time_cost(all): 10:52:37/0:10:21, loss=0.275196892976811, d_time=0.00(0.00), f_time=1.19(1.01), b_time=1.19(1.03), norm=4.798323107722345, lr=5.53596526724e-07
2023-11-03 01:05:33   INFO  epoch: 29/30, acc_iter=39472, cur_iter=1250/1318, batch_size=24, time_cost(epoch): 0:20:58/0:01:10, time_cost(all): 10:53:28/0:10:09, loss=0.274774214424129, d_time=0.00(0.00), f_time=1.11(1.01), b_time=0.89(1.03), norm=3.9123283957305537, lr=3.19445456078e-07
2023-11-03 01:06:23   INFO  epoch: 29/30, acc_iter=39522, cur_iter=1300/1318, batch_size=24, time_cost(epoch): 0:21:48/0:00:17, time_cost(all): 10:54:18/0:09:01, loss=0.274351535871447, d_time=0.00(0.00), f_time=0.98(1.01), b_time=1.12(1.03), norm=0.5104616922562847, lr=8.5294385432e-08
2023-11-03 01:06:23   INFO  **********************End training picture_models/picture_waymo_ssl_seal_decoder_mask_0.2(offline_30e)**********************