{
 "cells": [
  {
   "attachments": {},
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Benchmarking Self-supervised Vision Transformers in Astronomy\n",
    "This is a demo for evaluating our fine-tuned C-MAE models.\n",
    "\n",
    "## Import packages"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\u001b[32m[05/16 11:04:11 detectron2]: \u001b[0mRank of current process: 0. World size: 1\n",
      "\u001b[32m[05/16 11:04:13 detectron2]: \u001b[0mEnvironment info:\n",
      "-------------------------------  -----------------------------------------------------------------------------\n",
      "sys.platform                     linux\n",
      "Python                           3.8.10 (default, Apr 16 2024, 18:43:55) [GCC 7.5.0]\n",
      "numpy                            1.24.4\n",
      "detectron2                       0.6 @/root/venv_ObjectDetect/ViT-R-CNN/detectron2/detectron2\n",
      "Compiler                         GCC 7.5\n",
      "CUDA compiler                    CUDA 11.4\n",
      "detectron2 arch flags            8.6\n",
      "DETECTRON2_ENV_MODULE            <not set>\n",
      "PyTorch                          1.12.0+cu113 @/root/venv_ObjectDetect/lib/python3.8/site-packages/torch\n",
      "PyTorch debug build              False\n",
      "torch._C._GLIBCXX_USE_CXX11_ABI  False\n",
      "GPU available                    Yes\n",
      "GPU 0,1,2,3,4,5,6,7              NVIDIA A40 (arch=8.6)\n",
      "Driver version                   470.182.03\n",
      "CUDA_HOME                        /usr/local/cuda-11.4\n",
      "Pillow                           10.3.0\n",
      "torchvision                      0.13.0+cu113 @/root/venv_ObjectDetect/lib/python3.8/site-packages/torchvision\n",
      "torchvision arch flags           3.5, 5.0, 6.0, 7.0, 7.5, 8.0, 8.6\n",
      "fvcore                           0.1.5.post20221221\n",
      "iopath                           0.1.9\n",
      "cv2                              4.9.0\n",
      "-------------------------------  -----------------------------------------------------------------------------\n",
      "PyTorch built with:\n",
      "  - GCC 9.3\n",
      "  - C++ Version: 201402\n",
      "  - Intel(R) Math Kernel Library Version 2020.0.0 Product Build 20191122 for Intel(R) 64 architecture applications\n",
      "  - Intel(R) MKL-DNN v2.6.0 (Git Hash 52b5f107dd9cf10910aaa19cb47f3abf9b349815)\n",
      "  - OpenMP 201511 (a.k.a. OpenMP 4.5)\n",
      "  - LAPACK is enabled (usually provided by MKL)\n",
      "  - NNPACK is enabled\n",
      "  - CPU capability usage: AVX2\n",
      "  - CUDA Runtime 11.3\n",
      "  - NVCC architecture flags: -gencode;arch=compute_37,code=sm_37;-gencode;arch=compute_50,code=sm_50;-gencode;arch=compute_60,code=sm_60;-gencode;arch=compute_70,code=sm_70;-gencode;arch=compute_75,code=sm_75;-gencode;arch=compute_80,code=sm_80;-gencode;arch=compute_86,code=sm_86\n",
      "  - CuDNN 8.3.2  (built against CUDA 11.5)\n",
      "  - Magma 2.5.2\n",
      "  - Build settings: BLAS_INFO=mkl, BUILD_TYPE=Release, CUDA_VERSION=11.3, CUDNN_VERSION=8.3.2, CXX_COMPILER=/opt/rh/devtoolset-9/root/usr/bin/c++, CXX_FLAGS= -Wno-deprecated -fvisibility-inlines-hidden -DUSE_PTHREADPOOL -fopenmp -DNDEBUG -DUSE_KINETO -DUSE_FBGEMM -DUSE_QNNPACK -DUSE_PYTORCH_QNNPACK -DUSE_XNNPACK -DSYMBOLICATE_MOBILE_DEBUG_HANDLE -DEDGE_PROFILER_USE_KINETO -O2 -fPIC -Wno-narrowing -Wall -Wextra -Werror=return-type -Wno-missing-field-initializers -Wno-type-limits -Wno-array-bounds -Wno-unknown-pragmas -Wno-unused-parameter -Wno-unused-function -Wno-unused-result -Wno-unused-local-typedefs -Wno-strict-overflow -Wno-strict-aliasing -Wno-error=deprecated-declarations -Wno-stringop-overflow -Wno-psabi -Wno-error=pedantic -Wno-error=redundant-decls -Wno-error=old-style-cast -fdiagnostics-color=always -faligned-new -Wno-unused-but-set-variable -Wno-maybe-uninitialized -fno-math-errno -fno-trapping-math -Werror=format -Werror=cast-function-type -Wno-stringop-overflow, LAPACK_INFO=mkl, PERF_WITH_AVX=1, PERF_WITH_AVX2=1, PERF_WITH_AVX512=1, TORCH_VERSION=1.12.0, USE_CUDA=ON, USE_CUDNN=ON, USE_EXCEPTION_PTR=1, USE_GFLAGS=OFF, USE_GLOG=OFF, USE_MKL=ON, USE_MKLDNN=OFF, USE_MPI=OFF, USE_NCCL=ON, USE_NNPACK=ON, USE_OPENMP=ON, USE_ROCM=OFF, \n",
      "\n",
      "\u001b[32m[05/16 11:04:13 detectron2]: \u001b[0mCommand line arguments: Namespace(config_file='./configs/mask_rcnn_vit_b.py', dist_url='tcp://127.0.0.1:49152', eval_only=True, machine_rank=0, num_gpus=1, num_machines=1, opts=[], resume=False)\n",
      "\u001b[32m[05/16 11:04:13 detectron2]: \u001b[0mContents of args.config_file=./configs/mask_rcnn_vit_b.py:\n",
      "\u001b[38;5;204mfrom\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mfunctools\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204mimport\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mpartial\u001b[39m\n",
      "\u001b[38;5;204mfrom\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mfvcore\u001b[39m\u001b[38;5;15m.\u001b[39m\u001b[38;5;15mcommon\u001b[39m\u001b[38;5;15m.\u001b[39m\u001b[38;5;15mparam_scheduler\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204mimport\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mMultiStepParamScheduler\u001b[39m\n",
      "\n",
      "\u001b[38;5;204mfrom\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mdetectron2\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204mimport\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mmodel_zoo\u001b[39m\n",
      "\u001b[38;5;204mfrom\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mdetectron2\u001b[39m\u001b[38;5;15m.\u001b[39m\u001b[38;5;15mconfig\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204mimport\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mLazyCall\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;81mas\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mL\u001b[39m\n",
      "\u001b[38;5;204mimport\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mdetectron2\u001b[39m\u001b[38;5;15m.\u001b[39m\u001b[38;5;15mdata\u001b[39m\u001b[38;5;15m.\u001b[39m\u001b[38;5;15mtransforms\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;81mas\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mT\u001b[39m\n",
      "\u001b[38;5;204mfrom\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mdetectron2\u001b[39m\u001b[38;5;15m.\u001b[39m\u001b[38;5;15msolver\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204mimport\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mWarmupParamScheduler\u001b[39m\n",
      "\u001b[38;5;204mfrom\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mdetectron2\u001b[39m\u001b[38;5;15m.\u001b[39m\u001b[38;5;15mmodeling\u001b[39m\u001b[38;5;15m.\u001b[39m\u001b[38;5;15mbackbone\u001b[39m\u001b[38;5;15m.\u001b[39m\u001b[38;5;15mvit\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204mimport\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mget_vit_lr_decay_rate\u001b[39m\n",
      "\u001b[38;5;204mfrom\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mdetectron2\u001b[39m\u001b[38;5;15m.\u001b[39m\u001b[38;5;15mdata\u001b[39m\u001b[38;5;15m.\u001b[39m\u001b[38;5;15mdatasets\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204mimport\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mregister_coco_instances\u001b[39m\n",
      "\n",
      "\u001b[38;5;245m# dataset\u001b[39m\n",
      "\u001b[38;5;15mregister_coco_instances\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186mneuralens_train\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15m{\u001b[39m\u001b[38;5;15m}\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186m/root/DataSet/Neurlens/annotations/instances_train.json\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186m/root/DataSet/Neurlens/train/\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;15m)\u001b[39m\n",
      "\u001b[38;5;15mregister_coco_instances\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186mneuralens_val\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15m{\u001b[39m\u001b[38;5;15m}\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186m/root/DataSet/Neurlens/annotations/instances_val.json\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186m/root/DataSet/Neurlens/val/\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;15m)\u001b[39m\n",
      "\n",
      "\u001b[38;5;15mimage_size\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m512\u001b[39m\n",
      "\u001b[38;5;15mdataloader\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mmodel_zoo\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mget_config\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186mcommon/data/coco.py\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mdataloader\u001b[39m\n",
      "\u001b[38;5;15mdataloader\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mdataset\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mnames\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186mneuralens_train\u001b[39m\u001b[38;5;186m\"\u001b[39m\n",
      "\u001b[38;5;15mdataloader\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mmapper\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15maugmentations\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15m[\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mL\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mT\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mRandomFlip\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mhorizontal\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;81mTrue\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m  \u001b[39m\u001b[38;5;245m# flip first\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mL\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mT\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mResizeScale\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m(\u001b[39m\n",
      "\u001b[38;5;15m        \u001b[39m\u001b[38;5;15mmin_scale\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;141m0.1\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mmax_scale\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;141m2.0\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mtarget_height\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15mimage_size\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mtarget_width\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15mimage_size\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mL\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mT\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mFixedSizeCrop\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mcrop_size\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mimage_size\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mimage_size\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mpad\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;81mFalse\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m]\u001b[39m\n",
      "\u001b[38;5;15mdataloader\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mmapper\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mimage_format\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186mRGB\u001b[39m\u001b[38;5;186m\"\u001b[39m\n",
      "\u001b[38;5;15mdataloader\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mtotal_batch_size\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m64\u001b[39m\n",
      "\u001b[38;5;245m# recompute boxes due to cropping\u001b[39m\n",
      "\u001b[38;5;15mdataloader\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mmapper\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mrecompute_boxes\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;81mFalse\u001b[39m\n",
      "\u001b[38;5;15mdataloader\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mmapper\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15muse_instance_mask\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;81mFalse\u001b[39m\n",
      "\n",
      "\u001b[38;5;15mdataloader\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mtest\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mdataset\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mnames\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186mneuralens_val\u001b[39m\u001b[38;5;186m\"\u001b[39m\n",
      "\u001b[38;5;15mdataloader\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mtest\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mmapper\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15maugmentations\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15m[\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mL\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mT\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mResizeShortestEdge\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mshort_edge_length\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15mimage_size\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mmax_size\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15mimage_size\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m]\u001b[39m\n",
      "\n",
      "\n",
      "\u001b[38;5;245m# model\u001b[39m\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mmodel_zoo\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mget_config\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186mcommon/models/mask_rcnn_vitdet.py\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mmodel\u001b[39m\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mbackbone\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mnet\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mdrop_path_rate\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m0.1\u001b[39m\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mbackbone\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mnet\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mimg_size\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mimage_size\u001b[39m\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mbackbone\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15msquare_pad\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mimage_size\u001b[39m\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mroi_heads\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mnum_classes\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m2\u001b[39m\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mroi_heads\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mmask_in_features\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;81mNone\u001b[39m\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mpixel_mean\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15m[\u001b[39m\u001b[38;5;141m37.647\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m36.028\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m34.562\u001b[39m\u001b[38;5;15m]\u001b[39m\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mpixel_std\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15m[\u001b[39m\u001b[38;5;141m22.318\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m17.559\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m14.245\u001b[39m\u001b[38;5;15m]\u001b[39m\n",
      "\n",
      "\u001b[38;5;245m# Initialization and trainer settings\u001b[39m\n",
      "\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mmodel_zoo\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mget_config\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186mcommon/train.py\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mtrain\u001b[39m\n",
      "\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mamp\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15menabled\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;81mTrue\u001b[39m\n",
      "\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mddp\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mfp16_compression\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;81mTrue\u001b[39m\n",
      "\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15minit_checkpoint\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15m(\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;245m# \"./ckpt/cmae_base.pth\"\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186m./run/base/lr5e-4-wd0.1-bs64/model_final.pth\u001b[39m\u001b[38;5;186m\"\u001b[39m\n",
      "\u001b[38;5;15m)\u001b[39m\n",
      "\n",
      "\n",
      "\u001b[38;5;245m# Schedule\u001b[39m\n",
      "\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mmax_iter\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m32203\u001b[39m\n",
      "\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15meval_period\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m2000\u001b[39m\n",
      "\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mlog_period\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m100\u001b[39m\n",
      "\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15moutput_dir\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186m./run/base/lr5e-4-wd0.1-bs64\u001b[39m\u001b[38;5;186m\"\u001b[39m\n",
      "\n",
      "\u001b[38;5;15mlr_multiplier\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mL\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mWarmupParamScheduler\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m(\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mscheduler\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15mL\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mMultiStepParamScheduler\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m(\u001b[39m\n",
      "\u001b[38;5;15m        \u001b[39m\u001b[38;5;15mvalues\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m[\u001b[39m\u001b[38;5;141m1.0\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m0.1\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m0.01\u001b[39m\u001b[38;5;15m]\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m        \u001b[39m\u001b[38;5;15mmilestones\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m[\u001b[39m\u001b[38;5;141m28982\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m30592\u001b[39m\u001b[38;5;15m]\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m        \u001b[39m\u001b[38;5;15mnum_updates\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mmax_iter\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mwarmup_length\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;141m500\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m/\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mmax_iter\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mwarmup_factor\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;141m0.001\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m)\u001b[39m\n",
      "\n",
      "\n",
      "\u001b[38;5;245m# Optimizer\u001b[39m\n",
      "\u001b[38;5;15moptimizer\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mmodel_zoo\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mget_config\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186mcommon/optim.py\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mAdamW\u001b[39m\n",
      "\u001b[38;5;15moptimizer\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mlr\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m5e-4\u001b[39m\n",
      "\u001b[38;5;15moptimizer\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mweight_decay\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m0.1\u001b[39m\n",
      "\u001b[38;5;15moptimizer\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mparams\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mlr_factor_func\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mpartial\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mget_vit_lr_decay_rate\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mnum_layers\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;141m12\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mlr_decay_rate\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;141m0.7\u001b[39m\u001b[38;5;15m)\u001b[39m\n",
      "\u001b[38;5;15moptimizer\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mparams\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15moverrides\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15m{\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186mpos_embed\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;15m:\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15m{\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186mweight_decay\u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;15m:\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m0.0\u001b[39m\u001b[38;5;15m}\u001b[39m\u001b[38;5;15m}\u001b[39m\n",
      "\n",
      "\u001b[32m[05/16 11:04:14 detectron2]: \u001b[0mFull config saved to ./run/base/lr5e-4-wd0.1-bs64/config.yaml\n",
      "\u001b[32m[05/16 11:04:14 d2.utils.env]: \u001b[0mUsing a generated random seed 14071219\n",
      "\u001b[32m[05/16 11:04:15 d2.checkpoint.detection_checkpoint]: \u001b[0m[DetectionCheckpointer] Loading from ./run/base/lr5e-4-wd0.1-bs64/model_final.pth ...\n",
      "\u001b[32m[05/16 11:04:15 fvcore.common.checkpoint]: \u001b[0m[Checkpointer] Loading from ./run/base/lr5e-4-wd0.1-bs64/model_final.pth ...\n",
      "\u001b[5m\u001b[31mWARNING\u001b[0m \u001b[32m[05/16 11:04:16 d2.data.datasets.coco]: \u001b[0m\n",
      "Category ids in annotations are not in [1, #categories]! We'll apply a mapping for you.\n",
      "\n",
      "\u001b[32m[05/16 11:04:16 d2.data.datasets.coco]: \u001b[0mLoaded 1289 images in COCO format from /root/DataSet/Neurlens/annotations/instances_val.json\n",
      "\u001b[32m[05/16 11:04:16 d2.data.dataset_mapper]: \u001b[0m[DatasetMapper] Augmentations used in inference: [ResizeShortestEdge(short_edge_length=(512, 512), max_size=512)]\n",
      "\u001b[32m[05/16 11:04:16 d2.data.common]: \u001b[0mSerializing the dataset using: <class 'detectron2.data.common._TorchSerializedList'>\n",
      "\u001b[32m[05/16 11:04:16 d2.data.common]: \u001b[0mSerializing 1289 elements to byte tensors and concatenating them all ...\n",
      "\u001b[32m[05/16 11:04:16 d2.data.common]: \u001b[0mSerialized dataset takes 0.32 MiB\n",
      "\u001b[32m[05/16 11:04:16 d2.evaluation.evaluator]: \u001b[0mStart inference on 1289 batches\n",
      "\u001b[32m[05/16 11:04:17 d2.evaluation.evaluator]: \u001b[0mInference done 11/1289. Dataloading: 0.0005 s/iter. Inference: 0.0554 s/iter. Eval: 0.0002 s/iter. Total: 0.0561 s/iter. ETA=0:01:11\n",
      "\u001b[32m[05/16 11:04:22 d2.evaluation.evaluator]: \u001b[0mInference done 100/1289. Dataloading: 0.0008 s/iter. Inference: 0.0557 s/iter. Eval: 0.0002 s/iter. Total: 0.0567 s/iter. ETA=0:01:07\n",
      "\u001b[32m[05/16 11:04:27 d2.evaluation.evaluator]: \u001b[0mInference done 189/1289. Dataloading: 0.0008 s/iter. Inference: 0.0556 s/iter. Eval: 0.0002 s/iter. Total: 0.0566 s/iter. ETA=0:01:02\n",
      "\u001b[32m[05/16 11:04:32 d2.evaluation.evaluator]: \u001b[0mInference done 278/1289. Dataloading: 0.0008 s/iter. Inference: 0.0555 s/iter. Eval: 0.0002 s/iter. Total: 0.0565 s/iter. ETA=0:00:57\n",
      "\u001b[32m[05/16 11:04:37 d2.evaluation.evaluator]: \u001b[0mInference done 367/1289. Dataloading: 0.0008 s/iter. Inference: 0.0555 s/iter. Eval: 0.0002 s/iter. Total: 0.0565 s/iter. ETA=0:00:52\n",
      "\u001b[32m[05/16 11:04:42 d2.evaluation.evaluator]: \u001b[0mInference done 456/1289. Dataloading: 0.0008 s/iter. Inference: 0.0555 s/iter. Eval: 0.0002 s/iter. Total: 0.0565 s/iter. ETA=0:00:47\n",
      "\u001b[32m[05/16 11:04:47 d2.evaluation.evaluator]: \u001b[0mInference done 545/1289. Dataloading: 0.0008 s/iter. Inference: 0.0555 s/iter. Eval: 0.0002 s/iter. Total: 0.0566 s/iter. ETA=0:00:42\n",
      "\u001b[32m[05/16 11:04:52 d2.evaluation.evaluator]: \u001b[0mInference done 634/1289. Dataloading: 0.0008 s/iter. Inference: 0.0555 s/iter. Eval: 0.0002 s/iter. Total: 0.0566 s/iter. ETA=0:00:37\n",
      "\u001b[32m[05/16 11:04:57 d2.evaluation.evaluator]: \u001b[0mInference done 723/1289. Dataloading: 0.0008 s/iter. Inference: 0.0555 s/iter. Eval: 0.0002 s/iter. Total: 0.0565 s/iter. ETA=0:00:31\n",
      "\u001b[32m[05/16 11:05:02 d2.evaluation.evaluator]: \u001b[0mInference done 813/1289. Dataloading: 0.0008 s/iter. Inference: 0.0555 s/iter. Eval: 0.0001 s/iter. Total: 0.0565 s/iter. ETA=0:00:26\n",
      "\u001b[32m[05/16 11:05:07 d2.evaluation.evaluator]: \u001b[0mInference done 903/1289. Dataloading: 0.0008 s/iter. Inference: 0.0555 s/iter. Eval: 0.0001 s/iter. Total: 0.0564 s/iter. ETA=0:00:21\n",
      "\u001b[32m[05/16 11:05:12 d2.evaluation.evaluator]: \u001b[0mInference done 993/1289. Dataloading: 0.0008 s/iter. Inference: 0.0554 s/iter. Eval: 0.0001 s/iter. Total: 0.0564 s/iter. ETA=0:00:16\n",
      "\u001b[32m[05/16 11:05:17 d2.evaluation.evaluator]: \u001b[0mInference done 1082/1289. Dataloading: 0.0008 s/iter. Inference: 0.0554 s/iter. Eval: 0.0001 s/iter. Total: 0.0564 s/iter. ETA=0:00:11\n",
      "\u001b[32m[05/16 11:05:22 d2.evaluation.evaluator]: \u001b[0mInference done 1171/1289. Dataloading: 0.0008 s/iter. Inference: 0.0554 s/iter. Eval: 0.0001 s/iter. Total: 0.0564 s/iter. ETA=0:00:06\n",
      "\u001b[32m[05/16 11:05:27 d2.evaluation.evaluator]: \u001b[0mInference done 1260/1289. Dataloading: 0.0008 s/iter. Inference: 0.0554 s/iter. Eval: 0.0001 s/iter. Total: 0.0564 s/iter. ETA=0:00:01\n",
      "\u001b[32m[05/16 11:05:29 d2.evaluation.evaluator]: \u001b[0mTotal inference time: 0:01:12.490019 (0.056456 s / iter per device, on 1 devices)\n",
      "\u001b[32m[05/16 11:05:29 d2.evaluation.evaluator]: \u001b[0mTotal inference pure compute time: 0:01:11 (0.055398 s / iter per device, on 1 devices)\n",
      "\u001b[32m[05/16 11:05:29 d2.evaluation.coco_evaluation]: \u001b[0mPreparing results for COCO format ...\n",
      "\u001b[32m[05/16 11:05:29 d2.evaluation.coco_evaluation]: \u001b[0mEvaluating predictions with unofficial COCO API...\n",
      "Loading and preparing results...\n",
      "DONE (t=0.00s)\n",
      "creating index...\n",
      "index created!\n",
      "\u001b[32m[05/16 11:05:29 d2.evaluation.fast_eval_api]: \u001b[0mEvaluate annotation type *bbox*\n",
      "\u001b[32m[05/16 11:05:29 d2.evaluation.fast_eval_api]: \u001b[0mCOCOeval_opt.evaluate() finished in 0.06 seconds.\n",
      "\u001b[32m[05/16 11:05:29 d2.evaluation.fast_eval_api]: \u001b[0mAccumulating evaluation results...\n",
      "\u001b[32m[05/16 11:05:29 d2.evaluation.fast_eval_api]: \u001b[0mCOCOeval_opt.accumulate() finished in 0.01 seconds.\n",
      " Average Precision  (AP) @[ IoU=0.50:0.95 | area=   all | maxDets=100 ] = 0.399\n",
      " Average Precision  (AP) @[ IoU=0.50      | area=   all | maxDets=100 ] = 0.492\n",
      " Average Precision  (AP) @[ IoU=0.75      | area=   all | maxDets=100 ] = 0.457\n",
      " Average Precision  (AP) @[ IoU=0.50:0.95 | area= small | maxDets=100 ] = 0.388\n",
      " Average Precision  (AP) @[ IoU=0.50:0.95 | area=medium | maxDets=100 ] = 0.817\n",
      " Average Precision  (AP) @[ IoU=0.50:0.95 | area= large | maxDets=100 ] = 0.736\n",
      " Average Recall     (AR) @[ IoU=0.50:0.95 | area=   all | maxDets=  1 ] = 0.418\n",
      " Average Recall     (AR) @[ IoU=0.50:0.95 | area=   all | maxDets= 10 ] = 0.425\n",
      " Average Recall     (AR) @[ IoU=0.50:0.95 | area=   all | maxDets=100 ] = 0.425\n",
      " Average Recall     (AR) @[ IoU=0.50:0.95 | area= small | maxDets=100 ] = 0.406\n",
      " Average Recall     (AR) @[ IoU=0.50:0.95 | area=medium | maxDets=100 ] = 0.867\n",
      " Average Recall     (AR) @[ IoU=0.50:0.95 | area= large | maxDets=100 ] = 0.799\n",
      "\u001b[32m[05/16 11:05:29 d2.evaluation.coco_evaluation]: \u001b[0mEvaluation results for bbox: \n",
      "|   AP   |  AP50  |  AP75  |  APs   |  APm   |  APl   |\n",
      "|:------:|:------:|:------:|:------:|:------:|:------:|\n",
      "| 39.882 | 49.218 | 45.701 | 38.841 | 81.744 | 73.584 |\n",
      "\u001b[32m[05/16 11:05:29 d2.evaluation.coco_evaluation]: \u001b[0mPer-category bbox AP: \n",
      "| category   | AP    | category   | AP     |\n",
      "|:-----------|:------|:-----------|:-------|\n",
      "| BG         | 0.000 | lens       | 79.764 |\n",
      "\u001b[32m[05/16 11:05:29 d2.evaluation.testing]: \u001b[0mcopypaste: Task: bbox\n",
      "\u001b[32m[05/16 11:05:29 d2.evaluation.testing]: \u001b[0mcopypaste: AP,AP50,AP75,APs,APm,APl\n",
      "\u001b[32m[05/16 11:05:29 d2.evaluation.testing]: \u001b[0mcopypaste: 39.8818,49.2185,45.7007,38.8405,81.7444,73.5844\n",
      "OrderedDict([('bbox', {'AP': 39.88178391218254, 'AP50': 49.218494369377254, 'AP75': 45.7007266855179, 'APs': 38.84052959074099, 'APm': 81.74439340237494, 'APl': 73.58442634377406, 'AP-BG': 0.0, 'AP-lens': 79.76356782436508})])\n",
      "\u001b[32m[05/16 11:05:29 detectron2]: \u001b[0mRank of current process: 0. World size: 1\n",
      "\u001b[32m[05/16 11:05:29 detectron2]: \u001b[0mRank of current process: 0. World size: 1\n",
      "\u001b[32m[05/16 11:05:31 detectron2]: \u001b[0mEnvironment info:\n",
      "-------------------------------  -----------------------------------------------------------------------------\n",
      "sys.platform                     linux\n",
      "Python                           3.8.10 (default, Apr 16 2024, 18:43:55) [GCC 7.5.0]\n",
      "numpy                            1.24.4\n",
      "detectron2                       0.6 @/root/venv_ObjectDetect/ViT-R-CNN/detectron2/detectron2\n",
      "Compiler                         GCC 7.5\n",
      "CUDA compiler                    CUDA 11.4\n",
      "detectron2 arch flags            8.6\n",
      "DETECTRON2_ENV_MODULE            <not set>\n",
      "PyTorch                          1.12.0+cu113 @/root/venv_ObjectDetect/lib/python3.8/site-packages/torch\n",
      "PyTorch debug build              False\n",
      "torch._C._GLIBCXX_USE_CXX11_ABI  False\n",
      "GPU available                    Yes\n",
      "GPU 0,1,2,3,4,5,6,7              NVIDIA A40 (arch=8.6)\n",
      "Driver version                   470.182.03\n",
      "CUDA_HOME                        /usr/local/cuda-11.4\n",
      "Pillow                           10.3.0\n",
      "torchvision                      0.13.0+cu113 @/root/venv_ObjectDetect/lib/python3.8/site-packages/torchvision\n",
      "torchvision arch flags           3.5, 5.0, 6.0, 7.0, 7.5, 8.0, 8.6\n",
      "fvcore                           0.1.5.post20221221\n",
      "iopath                           0.1.9\n",
      "cv2                              4.9.0\n",
      "-------------------------------  -----------------------------------------------------------------------------\n",
      "PyTorch built with:\n",
      "  - GCC 9.3\n",
      "  - C++ Version: 201402\n",
      "  - Intel(R) Math Kernel Library Version 2020.0.0 Product Build 20191122 for Intel(R) 64 architecture applications\n",
      "  - Intel(R) MKL-DNN v2.6.0 (Git Hash 52b5f107dd9cf10910aaa19cb47f3abf9b349815)\n",
      "  - OpenMP 201511 (a.k.a. OpenMP 4.5)\n",
      "  - LAPACK is enabled (usually provided by MKL)\n",
      "  - NNPACK is enabled\n",
      "  - CPU capability usage: AVX2\n",
      "  - CUDA Runtime 11.3\n",
      "  - NVCC architecture flags: -gencode;arch=compute_37,code=sm_37;-gencode;arch=compute_50,code=sm_50;-gencode;arch=compute_60,code=sm_60;-gencode;arch=compute_70,code=sm_70;-gencode;arch=compute_75,code=sm_75;-gencode;arch=compute_80,code=sm_80;-gencode;arch=compute_86,code=sm_86\n",
      "  - CuDNN 8.3.2  (built against CUDA 11.5)\n",
      "  - Magma 2.5.2\n",
      "  - Build settings: BLAS_INFO=mkl, BUILD_TYPE=Release, CUDA_VERSION=11.3, CUDNN_VERSION=8.3.2, CXX_COMPILER=/opt/rh/devtoolset-9/root/usr/bin/c++, CXX_FLAGS= -Wno-deprecated -fvisibility-inlines-hidden -DUSE_PTHREADPOOL -fopenmp -DNDEBUG -DUSE_KINETO -DUSE_FBGEMM -DUSE_QNNPACK -DUSE_PYTORCH_QNNPACK -DUSE_XNNPACK -DSYMBOLICATE_MOBILE_DEBUG_HANDLE -DEDGE_PROFILER_USE_KINETO -O2 -fPIC -Wno-narrowing -Wall -Wextra -Werror=return-type -Wno-missing-field-initializers -Wno-type-limits -Wno-array-bounds -Wno-unknown-pragmas -Wno-unused-parameter -Wno-unused-function -Wno-unused-result -Wno-unused-local-typedefs -Wno-strict-overflow -Wno-strict-aliasing -Wno-error=deprecated-declarations -Wno-stringop-overflow -Wno-psabi -Wno-error=pedantic -Wno-error=redundant-decls -Wno-error=old-style-cast -fdiagnostics-color=always -faligned-new -Wno-unused-but-set-variable -Wno-maybe-uninitialized -fno-math-errno -fno-trapping-math -Werror=format -Werror=cast-function-type -Wno-stringop-overflow, LAPACK_INFO=mkl, PERF_WITH_AVX=1, PERF_WITH_AVX2=1, PERF_WITH_AVX512=1, TORCH_VERSION=1.12.0, USE_CUDA=ON, USE_CUDNN=ON, USE_EXCEPTION_PTR=1, USE_GFLAGS=OFF, USE_GLOG=OFF, USE_MKL=ON, USE_MKLDNN=OFF, USE_MPI=OFF, USE_NCCL=ON, USE_NNPACK=ON, USE_OPENMP=ON, USE_ROCM=OFF, \n",
      "\n",
      "\u001b[32m[05/16 11:05:31 detectron2]: \u001b[0mEnvironment info:\n",
      "-------------------------------  -----------------------------------------------------------------------------\n",
      "sys.platform                     linux\n",
      "Python                           3.8.10 (default, Apr 16 2024, 18:43:55) [GCC 7.5.0]\n",
      "numpy                            1.24.4\n",
      "detectron2                       0.6 @/root/venv_ObjectDetect/ViT-R-CNN/detectron2/detectron2\n",
      "Compiler                         GCC 7.5\n",
      "CUDA compiler                    CUDA 11.4\n",
      "detectron2 arch flags            8.6\n",
      "DETECTRON2_ENV_MODULE            <not set>\n",
      "PyTorch                          1.12.0+cu113 @/root/venv_ObjectDetect/lib/python3.8/site-packages/torch\n",
      "PyTorch debug build              False\n",
      "torch._C._GLIBCXX_USE_CXX11_ABI  False\n",
      "GPU available                    Yes\n",
      "GPU 0,1,2,3,4,5,6,7              NVIDIA A40 (arch=8.6)\n",
      "Driver version                   470.182.03\n",
      "CUDA_HOME                        /usr/local/cuda-11.4\n",
      "Pillow                           10.3.0\n",
      "torchvision                      0.13.0+cu113 @/root/venv_ObjectDetect/lib/python3.8/site-packages/torchvision\n",
      "torchvision arch flags           3.5, 5.0, 6.0, 7.0, 7.5, 8.0, 8.6\n",
      "fvcore                           0.1.5.post20221221\n",
      "iopath                           0.1.9\n",
      "cv2                              4.9.0\n",
      "-------------------------------  -----------------------------------------------------------------------------\n",
      "PyTorch built with:\n",
      "  - GCC 9.3\n",
      "  - C++ Version: 201402\n",
      "  - Intel(R) Math Kernel Library Version 2020.0.0 Product Build 20191122 for Intel(R) 64 architecture applications\n",
      "  - Intel(R) MKL-DNN v2.6.0 (Git Hash 52b5f107dd9cf10910aaa19cb47f3abf9b349815)\n",
      "  - OpenMP 201511 (a.k.a. OpenMP 4.5)\n",
      "  - LAPACK is enabled (usually provided by MKL)\n",
      "  - NNPACK is enabled\n",
      "  - CPU capability usage: AVX2\n",
      "  - CUDA Runtime 11.3\n",
      "  - NVCC architecture flags: -gencode;arch=compute_37,code=sm_37;-gencode;arch=compute_50,code=sm_50;-gencode;arch=compute_60,code=sm_60;-gencode;arch=compute_70,code=sm_70;-gencode;arch=compute_75,code=sm_75;-gencode;arch=compute_80,code=sm_80;-gencode;arch=compute_86,code=sm_86\n",
      "  - CuDNN 8.3.2  (built against CUDA 11.5)\n",
      "  - Magma 2.5.2\n",
      "  - Build settings: BLAS_INFO=mkl, BUILD_TYPE=Release, CUDA_VERSION=11.3, CUDNN_VERSION=8.3.2, CXX_COMPILER=/opt/rh/devtoolset-9/root/usr/bin/c++, CXX_FLAGS= -Wno-deprecated -fvisibility-inlines-hidden -DUSE_PTHREADPOOL -fopenmp -DNDEBUG -DUSE_KINETO -DUSE_FBGEMM -DUSE_QNNPACK -DUSE_PYTORCH_QNNPACK -DUSE_XNNPACK -DSYMBOLICATE_MOBILE_DEBUG_HANDLE -DEDGE_PROFILER_USE_KINETO -O2 -fPIC -Wno-narrowing -Wall -Wextra -Werror=return-type -Wno-missing-field-initializers -Wno-type-limits -Wno-array-bounds -Wno-unknown-pragmas -Wno-unused-parameter -Wno-unused-function -Wno-unused-result -Wno-unused-local-typedefs -Wno-strict-overflow -Wno-strict-aliasing -Wno-error=deprecated-declarations -Wno-stringop-overflow -Wno-psabi -Wno-error=pedantic -Wno-error=redundant-decls -Wno-error=old-style-cast -fdiagnostics-color=always -faligned-new -Wno-unused-but-set-variable -Wno-maybe-uninitialized -fno-math-errno -fno-trapping-math -Werror=format -Werror=cast-function-type -Wno-stringop-overflow, LAPACK_INFO=mkl, PERF_WITH_AVX=1, PERF_WITH_AVX2=1, PERF_WITH_AVX512=1, TORCH_VERSION=1.12.0, USE_CUDA=ON, USE_CUDNN=ON, USE_EXCEPTION_PTR=1, USE_GFLAGS=OFF, USE_GLOG=OFF, USE_MKL=ON, USE_MKLDNN=OFF, USE_MPI=OFF, USE_NCCL=ON, USE_NNPACK=ON, USE_OPENMP=ON, USE_ROCM=OFF, \n",
      "\n",
      "\u001b[32m[05/16 11:05:31 detectron2]: \u001b[0mCommand line arguments: Namespace(config_file='./configs/mask_rcnn_vit_l.py', dist_url='tcp://127.0.0.1:49152', eval_only=True, machine_rank=0, num_gpus=1, num_machines=1, opts=[], resume=False)\n",
      "\u001b[32m[05/16 11:05:31 detectron2]: \u001b[0mCommand line arguments: Namespace(config_file='./configs/mask_rcnn_vit_l.py', dist_url='tcp://127.0.0.1:49152', eval_only=True, machine_rank=0, num_gpus=1, num_machines=1, opts=[], resume=False)\n",
      "\u001b[32m[05/16 11:05:31 detectron2]: \u001b[0mContents of args.config_file=./configs/mask_rcnn_vit_l.py:\n",
      "\u001b[38;5;204mfrom\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mfunctools\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204mimport\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mpartial\u001b[39m\n",
      "\n",
      "\u001b[38;5;204mfrom\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15m.\u001b[39m\u001b[38;5;15mmask_rcnn_vit_b\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204mimport\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15m(\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mdataloader\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mlr_multiplier\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15moptimizer\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mget_vit_lr_decay_rate\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m)\u001b[39m\n",
      "\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mbackbone\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mnet\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15membed_dim\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m1024\u001b[39m\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mbackbone\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mnet\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mdepth\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m24\u001b[39m\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mbackbone\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mnet\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mnum_heads\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m16\u001b[39m\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mbackbone\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mnet\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mdrop_path_rate\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m0.1\u001b[39m\n",
      "\u001b[38;5;245m# 5, 11, 17, 23 for global attention\u001b[39m\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mbackbone\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mnet\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mwindow_block_indexes\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15m(\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mlist\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mrange\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;141m0\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m5\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m+\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mlist\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mrange\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;141m6\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m11\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m+\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mlist\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mrange\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;141m12\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m17\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m+\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mlist\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mrange\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;141m18\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m23\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m)\u001b[39m\n",
      "\u001b[38;5;15m)\u001b[39m\n",
      "\n",
      "\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mamp\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15menabled\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;81mFalse\u001b[39m\n",
      "\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mddp\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mfp16_compression\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;81mFalse\u001b[39m\n",
      "\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15minit_checkpoint\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15m(\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;245m# \"./ckpt/cmae_large.pth\"\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186m./large/lr5e-4-wd0.1-ld0.9/model_final.pth\u001b[39m\u001b[38;5;186m\"\u001b[39m\n",
      "\u001b[38;5;15m)\u001b[39m\n",
      "\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15moutput_dir\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186m./large/lr5e-4-wd0.1-ld0.9\u001b[39m\u001b[38;5;186m\"\u001b[39m\n",
      "\n",
      "\u001b[38;5;15moptimizer\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mparams\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mlr_factor_func\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mpartial\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mget_vit_lr_decay_rate\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mnum_layers\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;141m24\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mlr_decay_rate\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;141m0.9\u001b[39m\u001b[38;5;15m)\u001b[39m\n",
      "\n",
      "\u001b[32m[05/16 11:05:31 detectron2]: \u001b[0mContents of args.config_file=./configs/mask_rcnn_vit_l.py:\n",
      "\u001b[38;5;204mfrom\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mfunctools\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204mimport\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mpartial\u001b[39m\n",
      "\n",
      "\u001b[38;5;204mfrom\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15m.\u001b[39m\u001b[38;5;15mmask_rcnn_vit_b\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204mimport\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15m(\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mdataloader\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mlr_multiplier\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15moptimizer\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mget_vit_lr_decay_rate\u001b[39m\u001b[38;5;15m,\u001b[39m\n",
      "\u001b[38;5;15m)\u001b[39m\n",
      "\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mbackbone\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mnet\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15membed_dim\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m1024\u001b[39m\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mbackbone\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mnet\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mdepth\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m24\u001b[39m\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mbackbone\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mnet\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mnum_heads\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m16\u001b[39m\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mbackbone\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mnet\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mdrop_path_rate\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m0.1\u001b[39m\n",
      "\u001b[38;5;245m# 5, 11, 17, 23 for global attention\u001b[39m\n",
      "\u001b[38;5;15mmodel\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mbackbone\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mnet\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mwindow_block_indexes\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15m(\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;15mlist\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mrange\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;141m0\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m5\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m+\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mlist\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mrange\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;141m6\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m11\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m+\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mlist\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mrange\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;141m12\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m17\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m+\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mlist\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mrange\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;141m18\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;141m23\u001b[39m\u001b[38;5;15m)\u001b[39m\u001b[38;5;15m)\u001b[39m\n",
      "\u001b[38;5;15m)\u001b[39m\n",
      "\n",
      "\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mamp\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15menabled\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;81mFalse\u001b[39m\n",
      "\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mddp\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mfp16_compression\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;81mFalse\u001b[39m\n",
      "\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15minit_checkpoint\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15m(\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;245m# \"./ckpt/cmae_large.pth\"\u001b[39m\n",
      "\u001b[38;5;15m    \u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186m./large/lr5e-4-wd0.1-ld0.9/model_final.pth\u001b[39m\u001b[38;5;186m\"\u001b[39m\n",
      "\u001b[38;5;15m)\u001b[39m\n",
      "\u001b[38;5;15mtrain\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15moutput_dir\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;186m\"\u001b[39m\u001b[38;5;186m./large/lr5e-4-wd0.1-ld0.9\u001b[39m\u001b[38;5;186m\"\u001b[39m\n",
      "\n",
      "\u001b[38;5;15moptimizer\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mparams\u001b[39m\u001b[38;5;204m.\u001b[39m\u001b[38;5;15mlr_factor_func\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mpartial\u001b[39m\u001b[38;5;15m(\u001b[39m\u001b[38;5;15mget_vit_lr_decay_rate\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mnum_layers\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;141m24\u001b[39m\u001b[38;5;15m,\u001b[39m\u001b[38;5;15m \u001b[39m\u001b[38;5;15mlr_decay_rate\u001b[39m\u001b[38;5;204m=\u001b[39m\u001b[38;5;141m0.9\u001b[39m\u001b[38;5;15m)\u001b[39m\n",
      "\n",
      "\u001b[32m[05/16 11:05:31 detectron2]: \u001b[0mFull config saved to ./large/lr5e-4-wd0.1-ld0.9/config.yaml\n",
      "\u001b[32m[05/16 11:05:31 detectron2]: \u001b[0mFull config saved to ./large/lr5e-4-wd0.1-ld0.9/config.yaml\n",
      "\u001b[32m[05/16 11:05:31 d2.utils.env]: \u001b[0mUsing a generated random seed 31387514\n",
      "\u001b[32m[05/16 11:05:31 d2.utils.env]: \u001b[0mUsing a generated random seed 31387514\n",
      "\u001b[32m[05/16 11:05:35 d2.checkpoint.detection_checkpoint]: \u001b[0m[DetectionCheckpointer] Loading from ./large/lr5e-4-wd0.1-ld0.9/model_final.pth ...\n",
      "\u001b[32m[05/16 11:05:35 d2.checkpoint.detection_checkpoint]: \u001b[0m[DetectionCheckpointer] Loading from ./large/lr5e-4-wd0.1-ld0.9/model_final.pth ...\n",
      "\u001b[32m[05/16 11:05:35 fvcore.common.checkpoint]: \u001b[0m[Checkpointer] Loading from ./large/lr5e-4-wd0.1-ld0.9/model_final.pth ...\n",
      "\u001b[32m[05/16 11:05:35 fvcore.common.checkpoint]: \u001b[0m[Checkpointer] Loading from ./large/lr5e-4-wd0.1-ld0.9/model_final.pth ...\n",
      "\u001b[5m\u001b[31mWARNING\u001b[0m \u001b[32m[05/16 11:05:38 d2.data.datasets.coco]: \u001b[0m\n",
      "Category ids in annotations are not in [1, #categories]! We'll apply a mapping for you.\n",
      "\n",
      "\u001b[5m\u001b[31mWARNING\u001b[0m \u001b[32m[05/16 11:05:38 d2.data.datasets.coco]: \u001b[0m\n",
      "Category ids in annotations are not in [1, #categories]! We'll apply a mapping for you.\n",
      "\n",
      "\u001b[32m[05/16 11:05:38 d2.data.datasets.coco]: \u001b[0mLoaded 1289 images in COCO format from /root/DataSet/Neurlens/annotations/instances_val.json\n",
      "\u001b[32m[05/16 11:05:38 d2.data.datasets.coco]: \u001b[0mLoaded 1289 images in COCO format from /root/DataSet/Neurlens/annotations/instances_val.json\n",
      "\u001b[32m[05/16 11:05:38 d2.data.dataset_mapper]: \u001b[0m[DatasetMapper] Augmentations used in inference: [ResizeShortestEdge(short_edge_length=(512, 512), max_size=512)]\n",
      "\u001b[32m[05/16 11:05:38 d2.data.dataset_mapper]: \u001b[0m[DatasetMapper] Augmentations used in inference: [ResizeShortestEdge(short_edge_length=(512, 512), max_size=512)]\n",
      "\u001b[32m[05/16 11:05:38 d2.data.common]: \u001b[0mSerializing the dataset using: <class 'detectron2.data.common._TorchSerializedList'>\n",
      "\u001b[32m[05/16 11:05:38 d2.data.common]: \u001b[0mSerializing the dataset using: <class 'detectron2.data.common._TorchSerializedList'>\n",
      "\u001b[32m[05/16 11:05:38 d2.data.common]: \u001b[0mSerializing 1289 elements to byte tensors and concatenating them all ...\n",
      "\u001b[32m[05/16 11:05:38 d2.data.common]: \u001b[0mSerializing 1289 elements to byte tensors and concatenating them all ...\n",
      "\u001b[32m[05/16 11:05:38 d2.data.common]: \u001b[0mSerialized dataset takes 0.32 MiB\n",
      "\u001b[32m[05/16 11:05:38 d2.data.common]: \u001b[0mSerialized dataset takes 0.32 MiB\n",
      "\u001b[32m[05/16 11:05:38 d2.evaluation.evaluator]: \u001b[0mStart inference on 1289 batches\n",
      "\u001b[32m[05/16 11:05:38 d2.evaluation.evaluator]: \u001b[0mStart inference on 1289 batches\n",
      "\u001b[32m[05/16 11:05:40 d2.evaluation.evaluator]: \u001b[0mInference done 11/1289. Dataloading: 0.0005 s/iter. Inference: 0.1068 s/iter. Eval: 0.0002 s/iter. Total: 0.1074 s/iter. ETA=0:02:17\n",
      "\u001b[32m[05/16 11:05:40 d2.evaluation.evaluator]: \u001b[0mInference done 11/1289. Dataloading: 0.0005 s/iter. Inference: 0.1068 s/iter. Eval: 0.0002 s/iter. Total: 0.1074 s/iter. ETA=0:02:17\n",
      "\u001b[32m[05/16 11:05:45 d2.evaluation.evaluator]: \u001b[0mInference done 58/1289. Dataloading: 0.0008 s/iter. Inference: 0.1067 s/iter. Eval: 0.0002 s/iter. Total: 0.1077 s/iter. ETA=0:02:12\n",
      "\u001b[32m[05/16 11:05:45 d2.evaluation.evaluator]: \u001b[0mInference done 58/1289. Dataloading: 0.0008 s/iter. Inference: 0.1067 s/iter. Eval: 0.0002 s/iter. Total: 0.1077 s/iter. ETA=0:02:12\n",
      "\u001b[32m[05/16 11:05:51 d2.evaluation.evaluator]: \u001b[0mInference done 105/1289. Dataloading: 0.0008 s/iter. Inference: 0.1067 s/iter. Eval: 0.0002 s/iter. Total: 0.1078 s/iter. ETA=0:02:07\n",
      "\u001b[32m[05/16 11:05:51 d2.evaluation.evaluator]: \u001b[0mInference done 105/1289. Dataloading: 0.0008 s/iter. Inference: 0.1067 s/iter. Eval: 0.0002 s/iter. Total: 0.1078 s/iter. ETA=0:02:07\n",
      "\u001b[32m[05/16 11:05:56 d2.evaluation.evaluator]: \u001b[0mInference done 152/1289. Dataloading: 0.0008 s/iter. Inference: 0.1067 s/iter. Eval: 0.0002 s/iter. Total: 0.1078 s/iter. ETA=0:02:02\n",
      "\u001b[32m[05/16 11:05:56 d2.evaluation.evaluator]: \u001b[0mInference done 152/1289. Dataloading: 0.0008 s/iter. Inference: 0.1067 s/iter. Eval: 0.0002 s/iter. Total: 0.1078 s/iter. ETA=0:02:02\n",
      "\u001b[32m[05/16 11:06:01 d2.evaluation.evaluator]: \u001b[0mInference done 199/1289. Dataloading: 0.0008 s/iter. Inference: 0.1067 s/iter. Eval: 0.0002 s/iter. Total: 0.1077 s/iter. ETA=0:01:57\n",
      "\u001b[32m[05/16 11:06:01 d2.evaluation.evaluator]: \u001b[0mInference done 199/1289. Dataloading: 0.0008 s/iter. Inference: 0.1067 s/iter. Eval: 0.0002 s/iter. Total: 0.1077 s/iter. ETA=0:01:57\n",
      "\u001b[32m[05/16 11:06:06 d2.evaluation.evaluator]: \u001b[0mInference done 246/1289. Dataloading: 0.0008 s/iter. Inference: 0.1067 s/iter. Eval: 0.0002 s/iter. Total: 0.1077 s/iter. ETA=0:01:52\n",
      "\u001b[32m[05/16 11:06:06 d2.evaluation.evaluator]: \u001b[0mInference done 246/1289. Dataloading: 0.0008 s/iter. Inference: 0.1067 s/iter. Eval: 0.0002 s/iter. Total: 0.1077 s/iter. ETA=0:01:52\n",
      "\u001b[32m[05/16 11:06:11 d2.evaluation.evaluator]: \u001b[0mInference done 293/1289. Dataloading: 0.0008 s/iter. Inference: 0.1067 s/iter. Eval: 0.0002 s/iter. Total: 0.1077 s/iter. ETA=0:01:47\n",
      "\u001b[32m[05/16 11:06:11 d2.evaluation.evaluator]: \u001b[0mInference done 293/1289. Dataloading: 0.0008 s/iter. Inference: 0.1067 s/iter. Eval: 0.0002 s/iter. Total: 0.1077 s/iter. ETA=0:01:47\n",
      "\u001b[32m[05/16 11:06:16 d2.evaluation.evaluator]: \u001b[0mInference done 340/1289. Dataloading: 0.0008 s/iter. Inference: 0.1067 s/iter. Eval: 0.0002 s/iter. Total: 0.1078 s/iter. ETA=0:01:42\n",
      "\u001b[32m[05/16 11:06:16 d2.evaluation.evaluator]: \u001b[0mInference done 340/1289. Dataloading: 0.0008 s/iter. Inference: 0.1067 s/iter. Eval: 0.0002 s/iter. Total: 0.1078 s/iter. ETA=0:01:42\n",
      "\u001b[32m[05/16 11:06:21 d2.evaluation.evaluator]: \u001b[0mInference done 387/1289. Dataloading: 0.0008 s/iter. Inference: 0.1067 s/iter. Eval: 0.0002 s/iter. Total: 0.1078 s/iter. ETA=0:01:37\n",
      "\u001b[32m[05/16 11:06:21 d2.evaluation.evaluator]: \u001b[0mInference done 387/1289. Dataloading: 0.0008 s/iter. Inference: 0.1067 s/iter. Eval: 0.0002 s/iter. Total: 0.1078 s/iter. ETA=0:01:37\n",
      "\u001b[32m[05/16 11:06:26 d2.evaluation.evaluator]: \u001b[0mInference done 434/1289. Dataloading: 0.0008 s/iter. Inference: 0.1068 s/iter. Eval: 0.0002 s/iter. Total: 0.1078 s/iter. ETA=0:01:32\n",
      "\u001b[32m[05/16 11:06:26 d2.evaluation.evaluator]: \u001b[0mInference done 434/1289. Dataloading: 0.0008 s/iter. Inference: 0.1068 s/iter. Eval: 0.0002 s/iter. Total: 0.1078 s/iter. ETA=0:01:32\n",
      "\u001b[32m[05/16 11:06:31 d2.evaluation.evaluator]: \u001b[0mInference done 481/1289. Dataloading: 0.0008 s/iter. Inference: 0.1068 s/iter. Eval: 0.0002 s/iter. Total: 0.1079 s/iter. ETA=0:01:27\n",
      "\u001b[32m[05/16 11:06:31 d2.evaluation.evaluator]: \u001b[0mInference done 481/1289. Dataloading: 0.0008 s/iter. Inference: 0.1068 s/iter. Eval: 0.0002 s/iter. Total: 0.1079 s/iter. ETA=0:01:27\n",
      "\u001b[32m[05/16 11:06:36 d2.evaluation.evaluator]: \u001b[0mInference done 528/1289. Dataloading: 0.0008 s/iter. Inference: 0.1069 s/iter. Eval: 0.0002 s/iter. Total: 0.1080 s/iter. ETA=0:01:22\n",
      "\u001b[32m[05/16 11:06:36 d2.evaluation.evaluator]: \u001b[0mInference done 528/1289. Dataloading: 0.0008 s/iter. Inference: 0.1069 s/iter. Eval: 0.0002 s/iter. Total: 0.1080 s/iter. ETA=0:01:22\n",
      "\u001b[32m[05/16 11:06:41 d2.evaluation.evaluator]: \u001b[0mInference done 574/1289. Dataloading: 0.0008 s/iter. Inference: 0.1070 s/iter. Eval: 0.0002 s/iter. Total: 0.1080 s/iter. ETA=0:01:17\n",
      "\u001b[32m[05/16 11:06:41 d2.evaluation.evaluator]: \u001b[0mInference done 574/1289. Dataloading: 0.0008 s/iter. Inference: 0.1070 s/iter. Eval: 0.0002 s/iter. Total: 0.1080 s/iter. ETA=0:01:17\n",
      "\u001b[32m[05/16 11:06:46 d2.evaluation.evaluator]: \u001b[0mInference done 620/1289. Dataloading: 0.0008 s/iter. Inference: 0.1070 s/iter. Eval: 0.0002 s/iter. Total: 0.1081 s/iter. ETA=0:01:12\n",
      "\u001b[32m[05/16 11:06:46 d2.evaluation.evaluator]: \u001b[0mInference done 620/1289. Dataloading: 0.0008 s/iter. Inference: 0.1070 s/iter. Eval: 0.0002 s/iter. Total: 0.1081 s/iter. ETA=0:01:12\n",
      "\u001b[32m[05/16 11:06:51 d2.evaluation.evaluator]: \u001b[0mInference done 667/1289. Dataloading: 0.0008 s/iter. Inference: 0.1071 s/iter. Eval: 0.0002 s/iter. Total: 0.1081 s/iter. ETA=0:01:07\n",
      "\u001b[32m[05/16 11:06:51 d2.evaluation.evaluator]: \u001b[0mInference done 667/1289. Dataloading: 0.0008 s/iter. Inference: 0.1071 s/iter. Eval: 0.0002 s/iter. Total: 0.1081 s/iter. ETA=0:01:07\n",
      "\u001b[32m[05/16 11:06:56 d2.evaluation.evaluator]: \u001b[0mInference done 713/1289. Dataloading: 0.0008 s/iter. Inference: 0.1071 s/iter. Eval: 0.0002 s/iter. Total: 0.1082 s/iter. ETA=0:01:02\n",
      "\u001b[32m[05/16 11:06:56 d2.evaluation.evaluator]: \u001b[0mInference done 713/1289. Dataloading: 0.0008 s/iter. Inference: 0.1071 s/iter. Eval: 0.0002 s/iter. Total: 0.1082 s/iter. ETA=0:01:02\n",
      "\u001b[32m[05/16 11:07:01 d2.evaluation.evaluator]: \u001b[0mInference done 760/1289. Dataloading: 0.0008 s/iter. Inference: 0.1071 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:57\n",
      "\u001b[32m[05/16 11:07:01 d2.evaluation.evaluator]: \u001b[0mInference done 760/1289. Dataloading: 0.0008 s/iter. Inference: 0.1071 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:57\n",
      "\u001b[32m[05/16 11:07:06 d2.evaluation.evaluator]: \u001b[0mInference done 807/1289. Dataloading: 0.0008 s/iter. Inference: 0.1071 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:52\n",
      "\u001b[32m[05/16 11:07:06 d2.evaluation.evaluator]: \u001b[0mInference done 807/1289. Dataloading: 0.0008 s/iter. Inference: 0.1071 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:52\n",
      "\u001b[32m[05/16 11:07:12 d2.evaluation.evaluator]: \u001b[0mInference done 854/1289. Dataloading: 0.0008 s/iter. Inference: 0.1071 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:47\n",
      "\u001b[32m[05/16 11:07:12 d2.evaluation.evaluator]: \u001b[0mInference done 854/1289. Dataloading: 0.0008 s/iter. Inference: 0.1071 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:47\n",
      "\u001b[32m[05/16 11:07:17 d2.evaluation.evaluator]: \u001b[0mInference done 901/1289. Dataloading: 0.0008 s/iter. Inference: 0.1071 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:41\n",
      "\u001b[32m[05/16 11:07:17 d2.evaluation.evaluator]: \u001b[0mInference done 901/1289. Dataloading: 0.0008 s/iter. Inference: 0.1071 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:41\n",
      "\u001b[32m[05/16 11:07:22 d2.evaluation.evaluator]: \u001b[0mInference done 948/1289. Dataloading: 0.0008 s/iter. Inference: 0.1071 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:36\n",
      "\u001b[32m[05/16 11:07:22 d2.evaluation.evaluator]: \u001b[0mInference done 948/1289. Dataloading: 0.0008 s/iter. Inference: 0.1071 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:36\n",
      "\u001b[32m[05/16 11:07:27 d2.evaluation.evaluator]: \u001b[0mInference done 995/1289. Dataloading: 0.0008 s/iter. Inference: 0.1072 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:31\n",
      "\u001b[32m[05/16 11:07:27 d2.evaluation.evaluator]: \u001b[0mInference done 995/1289. Dataloading: 0.0008 s/iter. Inference: 0.1072 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:31\n",
      "\u001b[32m[05/16 11:07:32 d2.evaluation.evaluator]: \u001b[0mInference done 1042/1289. Dataloading: 0.0008 s/iter. Inference: 0.1072 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:26\n",
      "\u001b[32m[05/16 11:07:32 d2.evaluation.evaluator]: \u001b[0mInference done 1042/1289. Dataloading: 0.0008 s/iter. Inference: 0.1072 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:26\n",
      "\u001b[32m[05/16 11:07:37 d2.evaluation.evaluator]: \u001b[0mInference done 1089/1289. Dataloading: 0.0008 s/iter. Inference: 0.1072 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:21\n",
      "\u001b[32m[05/16 11:07:37 d2.evaluation.evaluator]: \u001b[0mInference done 1089/1289. Dataloading: 0.0008 s/iter. Inference: 0.1072 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:21\n",
      "\u001b[32m[05/16 11:07:42 d2.evaluation.evaluator]: \u001b[0mInference done 1136/1289. Dataloading: 0.0008 s/iter. Inference: 0.1072 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:16\n",
      "\u001b[32m[05/16 11:07:42 d2.evaluation.evaluator]: \u001b[0mInference done 1136/1289. Dataloading: 0.0008 s/iter. Inference: 0.1072 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:16\n",
      "\u001b[32m[05/16 11:07:47 d2.evaluation.evaluator]: \u001b[0mInference done 1183/1289. Dataloading: 0.0008 s/iter. Inference: 0.1072 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:11\n",
      "\u001b[32m[05/16 11:07:47 d2.evaluation.evaluator]: \u001b[0mInference done 1183/1289. Dataloading: 0.0008 s/iter. Inference: 0.1072 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:11\n",
      "\u001b[32m[05/16 11:07:52 d2.evaluation.evaluator]: \u001b[0mInference done 1230/1289. Dataloading: 0.0008 s/iter. Inference: 0.1072 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:06\n",
      "\u001b[32m[05/16 11:07:52 d2.evaluation.evaluator]: \u001b[0mInference done 1230/1289. Dataloading: 0.0008 s/iter. Inference: 0.1072 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:06\n",
      "\u001b[32m[05/16 11:07:57 d2.evaluation.evaluator]: \u001b[0mInference done 1277/1289. Dataloading: 0.0008 s/iter. Inference: 0.1072 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:01\n",
      "\u001b[32m[05/16 11:07:57 d2.evaluation.evaluator]: \u001b[0mInference done 1277/1289. Dataloading: 0.0008 s/iter. Inference: 0.1072 s/iter. Eval: 0.0001 s/iter. Total: 0.1082 s/iter. ETA=0:00:01\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.evaluator]: \u001b[0mTotal inference time: 0:02:19.088075 (0.108324 s / iter per device, on 1 devices)\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.evaluator]: \u001b[0mTotal inference time: 0:02:19.088075 (0.108324 s / iter per device, on 1 devices)\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.evaluator]: \u001b[0mTotal inference pure compute time: 0:02:17 (0.107187 s / iter per device, on 1 devices)\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.evaluator]: \u001b[0mTotal inference pure compute time: 0:02:17 (0.107187 s / iter per device, on 1 devices)\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.coco_evaluation]: \u001b[0mPreparing results for COCO format ...\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.coco_evaluation]: \u001b[0mPreparing results for COCO format ...\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.coco_evaluation]: \u001b[0mEvaluating predictions with unofficial COCO API...\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.coco_evaluation]: \u001b[0mEvaluating predictions with unofficial COCO API...\n",
      "Loading and preparing results...\n",
      "DONE (t=0.00s)\n",
      "creating index...\n",
      "index created!\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.fast_eval_api]: \u001b[0mEvaluate annotation type *bbox*\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.fast_eval_api]: \u001b[0mEvaluate annotation type *bbox*\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.fast_eval_api]: \u001b[0mCOCOeval_opt.evaluate() finished in 0.06 seconds.\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.fast_eval_api]: \u001b[0mCOCOeval_opt.evaluate() finished in 0.06 seconds.\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.fast_eval_api]: \u001b[0mAccumulating evaluation results...\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.fast_eval_api]: \u001b[0mAccumulating evaluation results...\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.fast_eval_api]: \u001b[0mCOCOeval_opt.accumulate() finished in 0.01 seconds.\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.fast_eval_api]: \u001b[0mCOCOeval_opt.accumulate() finished in 0.01 seconds.\n",
      " Average Precision  (AP) @[ IoU=0.50:0.95 | area=   all | maxDets=100 ] = 0.413\n",
      " Average Precision  (AP) @[ IoU=0.50      | area=   all | maxDets=100 ] = 0.494\n",
      " Average Precision  (AP) @[ IoU=0.75      | area=   all | maxDets=100 ] = 0.470\n",
      " Average Precision  (AP) @[ IoU=0.50:0.95 | area= small | maxDets=100 ] = 0.397\n",
      " Average Precision  (AP) @[ IoU=0.50:0.95 | area=medium | maxDets=100 ] = 0.852\n",
      " Average Precision  (AP) @[ IoU=0.50:0.95 | area= large | maxDets=100 ] = 0.728\n",
      " Average Recall     (AR) @[ IoU=0.50:0.95 | area=   all | maxDets=  1 ] = 0.434\n",
      " Average Recall     (AR) @[ IoU=0.50:0.95 | area=   all | maxDets= 10 ] = 0.437\n",
      " Average Recall     (AR) @[ IoU=0.50:0.95 | area=   all | maxDets=100 ] = 0.437\n",
      " Average Recall     (AR) @[ IoU=0.50:0.95 | area= small | maxDets=100 ] = 0.418\n",
      " Average Recall     (AR) @[ IoU=0.50:0.95 | area=medium | maxDets=100 ] = 0.896\n",
      " Average Recall     (AR) @[ IoU=0.50:0.95 | area= large | maxDets=100 ] = 0.794\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.coco_evaluation]: \u001b[0mEvaluation results for bbox: \n",
      "|   AP   |  AP50  |  AP75  |  APs   |  APm   |  APl   |\n",
      "|:------:|:------:|:------:|:------:|:------:|:------:|\n",
      "| 41.313 | 49.375 | 47.042 | 39.721 | 85.198 | 72.785 |\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.coco_evaluation]: \u001b[0mEvaluation results for bbox: \n",
      "|   AP   |  AP50  |  AP75  |  APs   |  APm   |  APl   |\n",
      "|:------:|:------:|:------:|:------:|:------:|:------:|\n",
      "| 41.313 | 49.375 | 47.042 | 39.721 | 85.198 | 72.785 |\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.coco_evaluation]: \u001b[0mPer-category bbox AP: \n",
      "| category   | AP    | category   | AP     |\n",
      "|:-----------|:------|:-----------|:-------|\n",
      "| BG         | 0.000 | lens       | 82.626 |\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.coco_evaluation]: \u001b[0mPer-category bbox AP: \n",
      "| category   | AP    | category   | AP     |\n",
      "|:-----------|:------|:-----------|:-------|\n",
      "| BG         | 0.000 | lens       | 82.626 |\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.testing]: \u001b[0mcopypaste: Task: bbox\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.testing]: \u001b[0mcopypaste: Task: bbox\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.testing]: \u001b[0mcopypaste: AP,AP50,AP75,APs,APm,APl\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.testing]: \u001b[0mcopypaste: AP,AP50,AP75,APs,APm,APl\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.testing]: \u001b[0mcopypaste: 41.3128,49.3752,47.0417,39.7212,85.1983,72.7848\n",
      "\u001b[32m[05/16 11:07:59 d2.evaluation.testing]: \u001b[0mcopypaste: 41.3128,49.3752,47.0417,39.7212,85.1983,72.7848\n",
      "OrderedDict([('bbox', {'AP': 41.312812861193606, 'AP50': 49.37523403229914, 'AP75': 47.04165445507224, 'APs': 39.721216402163044, 'APm': 85.19832276515407, 'APl': 72.78479384201859, 'AP-BG': 0.0, 'AP-lens': 82.62562572238721})])\n"
     ]
    }
   ],
   "source": [
    "import warnings\n",
    "\n",
    "# Silence all Python warnings so the evaluation logs below stay readable.\n",
    "warnings.simplefilter('ignore')\n",
    "\n",
    "# Run the evaluation script once per config, ViT-B first and then ViT-L,\n",
    "# passing --eval-only each time. IPython expands {config_path} before %run executes.\n",
    "# NOTE(review): the saved output of this cell shows each detectron2 log line twice;\n",
    "# presumably the repeated %run attaches a second log handler -- confirm.\n",
    "for config_path in ('./configs/mask_rcnn_vit_b.py', './configs/mask_rcnn_vit_l.py'):\n",
    "    %run lazyconfig_train_net.py --config-file {config_path} --eval-only"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "venv_ObjectDetect",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.10"
  },
  "orig_nbformat": 4,
  "vscode": {
   "interpreter": {
    "hash": "fe06d0f75ca04f5e91fc552fa754d241604db3f2641104ecd76b3cf8be778666"
   }
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
