    def __init__(self,
                 bits: int,
                 group_size: int,
                 desc_act: bool,
                 sym: bool,
                 in_features: int,
                 out_features: int,
                 bias: bool,
                 pack_dtype: t.dtype,
                 backend: BACKEND,
                 adapter: Adapter,
                 name: str = None,
                 register_buffers: bool = False,
                 register_buffers_in_features: int = None,
                 register_buffers_out_features: int = None,
                 **kwargs):
        super().__init__()


        # ...
        # gptqmodel_5.6.0 


        # store qzero format
        self._qzeros_format = 1 # only valid values are 1 and 2 for GPTQ v1 GPTQ v2

        # NOTE BPDQ
        # vvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvvv
        self.bpdq_flag = kwargs.get("bpdq_flag", False)
        self.bpdq_k_bits = kwargs.get("bpdq_k_bits", 0) 
        # ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
        # NOTE BPDQ




        # ...
        # gptqmodel_5.6.0 
        # # most kernels share same buffers so they can share same register buffer code
        # if register_buffers:
        #     # some kernels auto-pads in/out features
        #     in_features = self.in_features if not register_buffers_in_features else register_buffers_in_features
        #     out_features = self.out_features if not register_buffers_out_features else register_buffers_out_features

        #     self.register_buffer(
        #         "qweight",
        #         t.zeros((in_features // self.pack_dtype_bits * self.bits, out_features), dtype=self.pack_dtype),
        #     )
        #     self.register_buffer(
        #         "qzeros",
        #         t.zeros(
        #             (
        #                 math.ceil(in_features / self.group_size),
        #                 out_features // self.pack_dtype_bits * self.bits,
        #             ),
        #             dtype=self.pack_dtype,
        #         ),
        #     )
        #     self.register_buffer(
        #         "scales",
        #         t.zeros(
        #             (math.ceil(in_features / self.group_size), out_features),
        #             dtype=t.float16,
        #         ),
        #     )
        #     self.register_buffer(
        #         "g_idx",
        #         t.tensor([i // self.group_size for i in range(in_features)], dtype=t.int32),
        #     )
        #     if bias:
        #         self.register_buffer("bias", t.zeros(out_features, dtype=t.float16))
        #     else:
        #         self.bias = None


        # NOTE BPDQ
        # most kernels share same buffers so they can share same register buffer code
        if register_buffers:
            # some kernels auto-pads in/out features
            in_features = self.in_features if not register_buffers_in_features else register_buffers_in_features
            out_features = self.out_features if not register_buffers_out_features else register_buffers_out_features

            if self.bpdq_flag:
                log.debug(f"Registering BPDQ buffers (c, B) for {self.name} [LUT-GEMM Layout]")
                
                k = self.bpdq_k_bits
                if k == 0:
                    raise ValueError("bpdq_k_bits is 0, but bpdq_flag is True.")
                
                if in_features % 32 != 0:
                     raise ValueError(f"in_features ({in_features}) must be divisible by 32 for LUT-GEMM int32 packing.")

                # Num_Groups
                num_column_groups = math.ceil(in_features / self.group_size)
                # Shape: [Groups, Bits+1, Out_Features]
                c_shape = (num_column_groups, k + 1, out_features)
                
                if self.group_size == 256 and (in_features % 256 != 0):
                    in_features = ((in_features + 256 - 1) // 256) * 256 
                b_shape = (in_features // 32, k, out_features)

                
                # c: float16
                self.register_buffer("c", t.zeros(c_shape, dtype=t.float16))
                # B: int32 
                self.register_buffer("B", t.zeros(b_shape, dtype=t.int32))

                self.qweight = None
                self.qzeros  = None
                self.scales  = None
                self.g_idx   = None

                # NOTE qween2.5-7b, has linear bias
                if bias:
                    self.register_buffer("bias", t.zeros(out_features, dtype=t.float16))
                else:
                    self.bias = None    


            else:
                self.register_buffer(
                    "qweight",
                    t.zeros((in_features // self.pack_dtype_bits * self.bits, out_features), dtype=self.pack_dtype),
                )
                self.register_buffer(
                    "qzeros",
                    t.zeros(
                        (
                            math.ceil(in_features / self.group_size),
                            out_features // self.pack_dtype_bits * self.bits,
                        ),
                        dtype=self.pack_dtype,
                    ),
                )
                self.register_buffer(
                    "scales",
                    t.zeros(
                        (math.ceil(in_features / self.group_size), out_features),
                        dtype=t.float16,
                    ),
                )
                self.register_buffer(
                    "g_idx",
                    t.tensor([i // self.group_size for i in range(in_features)], dtype=t.int32),
                )
                if bias:
                    self.register_buffer("bias", t.zeros(out_features, dtype=t.float16))
                else:
                    self.bias = None
        # NOTE BPDQ





    def list_buffers(self) -> List:
        buf = []
        if hasattr(self, "qweight") and self.qweight is not None:
            buf.append(self.qweight)
        if hasattr(self, "qzeros") and self.qzeros is not None:
            buf.append(self.qzeros)
        if hasattr(self, "scales") and self.scales is not None:
            buf.append(self.scales)
        if hasattr(self, "g_idx") and self.g_idx is not None:
            buf.append(self.g_idx)
        if hasattr(self, "bias") and self.bias is not None:
            buf.append(self.bias)
        # NOTE BPDQ
        if hasattr(self, "c") and self.c is not None:
            buf.append(self.c)
        if hasattr(self, "B") and self.B is not None:
            buf.append(self.B)
        # NOTE BPDQ



    # NOTE BPDQ
    def _infer_buffer_device(self) -> t.device:
        if hasattr(self, "g_idx") and isinstance(self.g_idx, t.Tensor):
            return self.g_idx.device
        for buf in self.list_buffers():
            if isinstance(buf, t.Tensor):
                return buf.device
        return t.device("cpu")
    # NOTE BPDQ


    def pack_original(self, linear: nn.Module, scales: t.Tensor, zeros: t.Tensor, g_idx: t.Tensor=None,
                        # NOTE BPDQ
                        my_c: Optional[t.Tensor] = None, my_b: Optional[t.Tensor] = None
                        # NOTE BPDQ
                      ):
# NOTE BPDQ
        with THREADPOOLCTL.threadpool_limits(1):

            if my_c is not None and my_b is not None:
                log.debug(f"Packing {self.name} using BPDQ (c/B) path.")
                
                self.register_buffer("c", my_c)
                self.register_buffer("B", my_b)
                
                self.register_buffer("g_idx", g_idx if g_idx is not None else self.g_idx)


                if linear.bias is not None:
                    b = linear.bias.detach().to(device="cpu", dtype=t.float16).contiguous()
                    if isinstance(getattr(self, "_buffers", None), dict) and isinstance(self._buffers.get("bias", None), t.Tensor):
                        self._buffers["bias"].copy_(b)
                    else:
                        self.register_buffer("bias", b)
                else:
                    if isinstance(getattr(self, "_buffers", None), dict):
                        self._buffers.pop("bias", None)
                    self.bias = None
                
            else:  
                # NOTE gptqmodel_5.6.0
# NOTE BPDQ



    def list_buffers(self) -> List:
        buf = []
        if hasattr(self, "qweight") and self.qweight is not None:
            buf.append(self.qweight)
        if hasattr(self, "qzeros") and self.qzeros is not None:
            buf.append(self.qzeros)
        if hasattr(self, "scales") and self.scales is not None:
            buf.append(self.scales)
        if hasattr(self, "bias") and self.bias is not None:
            buf.append(self.bias)
# NOTE BPDQ
        if hasattr(self, "c") and self.c is not None:
            buf.append(self.c)
        if hasattr(self, "B") and self.B is not None:
            buf.append(self.B)
# NOTE BPDQ
        return buf
