
class GPTQProcessor(LoopProcessor):
    def __init__(
        self,
        tokenizer,
        qcfg: QuantizeConfig,
        calibration,
        prepare_dataset_func,
        calibration_concat_size: Optional[int],
        calibration_sort: Optional[str],
        batch_size: int,
        require_fwd: bool = True,
        calculate_w_wq_diff: bool = False,
        calibration_concat_separator: Optional[str] = None,
    ):

        super().__init__(
            tokenizer=tokenizer,
            qcfg=qcfg,
            calibration=calibration,
            calibration_concat_size=calibration_concat_size,
            calibration_sort=calibration_sort,
            calibration_concat_separator=calibration_concat_separator,
            prepare_dataset_func=prepare_dataset_func,
            batch_size=batch_size,
            require_fwd=require_fwd,
            fwd_after_process=True,
            subset_forward_early_stop=True,
        )

        self.calculate_w_wq_diff = calculate_w_wq_diff
        self.avg_losses = []

    # ... ... 


    def process(
        self,
        module: NamedModule,
        device: torch.device = None,
        subset: Optional[Dict[str, NamedModule]] = None,
        previous_subset: Optional[Dict[str, NamedModule]] = None,
        subset_index: Optional[int] = None,
        subset_total: Optional[int] = None,
    ):
        # ...
        # gptqmodel_5.6.0 
        # wq, q_scales, q_zeros, q_g_idx, duration, avg_loss, damp_percent, nsamples = g.quantize()

        # BPDQ
        c, B = None, None
        if self.qcfg.bpdq_flag:
            wq, q_scales, q_zeros, q_g_idx, duration, avg_loss, damp_percent, nsamples, c, B = g.quantize()
        else:
            wq, q_scales, q_zeros, q_g_idx, duration, avg_loss, damp_percent, nsamples = g.quantize()


        # ...
        # gptqmodel_5.6.0
        # with self.lock:
            # self.durations.append(duration)
            # self.avg_losses.append(avg_loss)
            # self.module_names.append(f"layer-{module.layer_index}-{module.name}")

        # BPDQ
        if c is not None and B is not None:
            c = c.to(CPU)
            B = B.to(CPU)
        with self.lock:
            self.durations.append(duration)
            self.avg_losses.append(avg_loss)
            self.module_names.append(f"layer-{module.layer_index}-{module.name}")
            if c is not None and B is not None:
                module.state.update({"my_c": c})
                module.state.update({"my_b": B})


    def submodule_finalize(self, module: NamedModule, model: BaseQModel, **kwargs):
        # ...
        # gptqmodel_5.6.0
            # q_zeros = module.state.pop("q_zeros").clone()
            # q_scales = module.state.pop("q_scales").clone()
            # q_g_idx = module.state.pop("q_g_idx").clone()

        # BPDQ
            my_c = module.state.pop("my_c", None)
            my_b = module.state.pop("my_b", None)



        # ...
        # gptqmodel_5.6.0
            # with parent_module_lock(parent_key):
            #     packer_label = pack_module(
            #         name=module.full_name,
            #         qModules=qModules,
            #         q_scales=q_scales,
            #         q_zeros=q_zeros,
            #         q_g_idx=q_g_idx,
            #         layers=layers,
            #         quant_linear_cls=model.qlinear_kernel,
            #         lock=self.lock,
            #         quantize_config=self.qcfg,
            #     )

        # BPDQ
            with parent_module_lock(parent_key):
                packer_label = pack_module(
                    name=module.full_name,
                    qModules=qModules,
                    q_scales=q_scales,
                    q_zeros=q_zeros,
                    q_g_idx=q_g_idx,
                    layers=layers,
                    quant_linear_cls=model.qlinear_kernel,
                    lock=self.lock,
                    quantize_config=self.qcfg,
                    my_c=my_c,
                    my_b=my_b
                )



