CLASS_NAMES: ['Car', 'Pedestrian', 'Cyclist']  # 'Pedestrian', 'Cyclist'

DATA_CONFIG:
    _BASE_CONFIG_: cfgs/dataset_configs/kitti_dataset.yaml
    GET_ITEM_LIST: ['points', 'images', 'calib_matricies', 'segmentation', 'gt_boxes2d']

    DATA_AUGMENTOR:
        DISABLE_AUG_LIST: ['placeholder']
        AUG_CONFIG_LIST:
            -   NAME: gt_sampling
                AUG_WITH_IMAGE: True # use PC-Image Aug
                JOINT_SAMPLE: True # joint sample with point
                KEEP_RAW: False # keep original PC
                POINT_REFINE: True # refine points with different calib
                BOX_IOU_THRES: 0.5
                IMG_AUG_TYPE: by_depth
                AUG_USE_TYPE: annotation
                IMG_ROOT_PATH: training/image_2

                USE_ROAD_PLANE: True
                DB_INFO_PATH:
                    - kitti_dbinfos_train.pkl
                PREPARE: {
                        filter_by_min_points: [ 'Car:5', 'Pedestrian:10', 'Cyclist:10'],  # 'Pedestrian:10', 'Cyclist:10'
                        filter_by_difficulty: [ -1 ],
                    }

                SAMPLE_GROUPS: [ 'Car: 15', 'Pedestrian:8', 'Cyclist:8']
                NUM_POINT_FEATURES: 4
                DATABASE_WITH_FAKELIDAR: False
                REMOVE_EXTRA_WIDTH: [0.0, 0.0, 0.0]
                LIMIT_WHOLE_SCENE: False
        
            -   NAME: random_world_flip
                ENABLE_PROB: 0.5
                ALONG_AXIS_LIST: [ 'x' ]
        
            -   NAME: random_world_rotation
                ENABLE_PROB: 0.5
                WORLD_ROT_ANGLE: [ -0.78539816, 0.78539816 ]
        
            -   NAME: random_world_scaling
                ENABLE_PROB: 0.5
                WORLD_SCALE_RANGE: [ 0.9, 1.1 ]

    DATA_PROCESSOR:
        -   NAME: mask_points_and_boxes_outside_range
            REMOVE_OUTSIDE_BOXES: True

        -   NAME: sample_points
            NUM_POINTS: {
                'train': 16384,
                'test': 16384
            }

        -   NAME: shuffle_points
            SHUFFLE_ENABLED: {
                'train': True,
                'test': False
            }

MODEL:
    NAME: BiProDet

    BACKBONE_3D:
        NAME: 3DSSD_Backbone
        SA_CONFIG:
            NPOINT_LIST: [[4096], [512, 512], [256, 256]]
            SAMPLE_RANGE_LIST: [[[0, 16384]], [[0, 4096], [0, 4096]], [[0, 512], [512, 1024]]]
            SAMPLE_METHOD_LIST: [['d-fps'], ['s-fps', 'd-fps'], ['s-fps', 'd-fps']]
            RADIUS: [[0.2, 0.4, 0.8], [0.4, 0.8, 1.6], [1.6, 3.2, 4.8]]
            NSAMPLE: [[32, 32, 64], [32, 32, 64], [32, 32, 64]]
            MLPS: [[[16, 16, 32], [16, 16, 32], [32, 32, 64]],
                   [[64, 64, 128], [64, 64, 128], [64, 96, 128]],
                   [[128, 128, 256], [128, 196, 256], [128, 256, 256]]]
            AGGREGATION_MLPS: [[64], [128], [256]]
            CONFIDENCE_MLPS: [[32], [64], []]
            IMAGE_BACKBONE_RATIO: 1.0
            WEIGHT_GAMMA: 1.0
            DILATED_RADIUS_GROUP: True
        FP_MLPS: [[32, 32, 64], [32, 32, 64], [64, 64, 128]]

    POINT_HEAD:
        NAME: PointHeadVote
        CLASS_AGNOSTIC: False
        USE_BN: True

        SAMPLE_RANGE: [ 0, 256 ]
        VOTE_CONFIG:
            VOTE_FC: [ 128 ]
            MAX_TRANSLATION_RANGE: [ 3.0, 3.0, 2.0 ]

        SA_CONFIG:
            RADIUS: [ 4.8, 6.4 ]
            NSAMPLE: [ 48, 64 ]
            MLPS: [[ 256, 256, 512 ],
                   [ 256, 512, 1024 ]]
        
        FP_CLS_FC: []
        PART_FC: []
        SHARED_FC: [ 512, 256 ]
        CLS_FC: [ 128 ]
        REG_FC: [ 128 ]

        TARGET_CONFIG:
            VOTE_EXTRA_WIDTH: [0.1, 0.1, 0.1]
            PART_EXTRA_WIDTH: [0.2, 0.2, 0.2]
            ASSIGN_METHOD: mask
            GT_CENTRAL_RADIUS: 10.0
            BOX_CODER: PointBinResidualCoder
            BOX_CODER_CONFIG: {
                'use_mean_size': False,
                'angle_bin_num': 12
            }

        LOSS_CONFIG:
            LOSS_CLS: WeightedBinaryCrossEntropyWithCenterness
            LOSS_REG: WeightedSmoothL1Loss
            LOSS_SASA_CONFIG: {
                'set_ignore_flag': True,
                'extra_width': [1.0, 1.0, 1.0],
                'layer_weights': [0.01, 0.1, 0]
            }
            AXIS_ALIGNED_IOU_LOSS_REGULARIZATION: True
            CORNER_LOSS_REGULARIZATION: True
            LOSS_WEIGHTS: {
                'vote_reg_weight': 1.0,
                'point_cls_weight': 1.0,
                'point_offset_reg_weight': 1.0,
                'point_angle_cls_weight': 1.0,
                'point_angle_reg_weight': 1.0,
                'point_iou_weight': 1.0,
                'point_corner_weight': 1.0,
            }

    ROI_HEAD:
        NAME: PDVHead
        CLASS_AGNOSTIC: True

        SHARED_FC: [256, 256]
        CLS_FC: [256, 256]
        REG_FC: [256, 256]
        DP_RATIO: 0.3

        NMS_CONFIG:
            TRAIN:
                NMS_TYPE: nms_gpu
                MULTI_CLASSES_NMS: False
                NMS_PRE_MAXSIZE: 9000
                NMS_POST_MAXSIZE: 512
                NMS_THRESH: 0.8
            TEST:
                NMS_TYPE: nms_gpu
                MULTI_CLASSES_NMS: False
                NMS_PRE_MAXSIZE: 1024
                NMS_POST_MAXSIZE: 100
                NMS_THRESH: 0.7

        # Density-aware RoI Grid
        ROI_GRID_POOL:
            # FEATURE_LOCATIONS: [x_conv3, x_conv4]
            GRID_SIZE: 6
            NUM_FEATURES: [64]
            POOL_LAYERS:
                MLPS: [[32, 32], [32, 32]]
                POOL_RADIUS: [0.4, 0.8]
                NSAMPLE: [16, 16]
                POOL_METHOD: max_pool
                USE_DENSITY: True

            ATTENTION:
                ENABLED: True
                NUM_FEATURES: 64
                NUM_HEADS: 1
                NUM_HIDDEN_FEATURES: 128
                NUM_LAYERS: 1
                POSITIONAL_ENCODER: density_grid_points
                MAX_NUM_BOXES: 20
                DROPOUT: 0.1
                COMBINE: True
                MASK_EMPTY_POINTS: True

        # Density confidence prediction
        DENSITY_CONFIDENCE:
            ENABLED: True
            GRID_SIZE: 1
            MAX_NUM_BOXES: 20
            ADD_SHARED_FEATURES: True

        TARGET_CONFIG:
            BOX_CODER: ResidualCoder
            ROI_PER_IMAGE: 128
            FG_RATIO: 0.5

            SAMPLE_ROI_BY_EACH_CLASS: True
            CLS_SCORE_TYPE: roi_iou

            CLS_FG_THRESH: 0.75
            CLS_BG_THRESH: 0.25
            CLS_BG_THRESH_LO: 0.1
            HARD_BG_RATIO: 0.8

            REG_FG_THRESH: 0.55

        LOSS_CONFIG:
            CLS_LOSS: BinaryCrossEntropy
            REG_LOSS: smooth-l1
            CORNER_LOSS_REGULARIZATION: True
            LOSS_WEIGHTS: {
                'rcnn_cls_weight': 1.0,
                'rcnn_reg_weight': 1.0,
                'rcnn_corner_weight': 1.0,
                'code_weights': [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]
            }

    POST_PROCESSING:
        RECALL_THRESH_LIST: [0.3, 0.5, 0.7]
        SCORE_THRESH: 0.1
        OUTPUT_RAW_SCORE: False

        EVAL_METRIC: kitti

        NMS_CONFIG:
            MULTI_CLASSES_NMS: False
            NMS_TYPE: nms_gpu
            NMS_THRESH: 0.1
            NMS_PRE_MAXSIZE: 4096
            NMS_POST_MAXSIZE: 500

OPTIMIZATION:
    BATCH_SIZE_PER_GPU: 2
    NUM_EPOCHS: 80

    OPTIMIZER: adam_onecycle
    LR: 0.003
    WEIGHT_DECAY: 0.01
    MOMENTUM: 0.9

    MOMS: [0.95, 0.85]
    PCT_START: 0.4
    DIV_FACTOR: 10
    DECAY_STEP_LIST: [35, 45]
    LR_DECAY: 0.1
    LR_CLIP: 0.0000001

    LR_WARMUP: False
    WARMUP_EPOCH: 1

    GRAD_NORM_CLIP: 10

