Commit c4a8c77

Kaihui-intel, pre-commit-ci[bot], and XuehaoSun authored

Add update_g_idx flag for setting qweight&g_idx (#2143)

Signed-off-by: Kaihui-intel <[email protected]>
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Co-authored-by: Sun, Xuehao <[email protected]>
1 parent: ae65c0d

File tree

1 file changed, 7 insertions(+), 0 deletions(-)

  • neural_compressor/transformers/quantization/utils.py


neural_compressor/transformers/quantization/utils.py

@@ -238,9 +238,16 @@ def _replace_linear(
                     dtype=torch.int32,
                     device=torch.device(device),
                 )
+
+                # Note: update_g_idx is only applicable for ipex versions >=2.7
                 model._modules[name].set_weights_bias(
                     module.qweight.data if hasattr(module, "qweight") else weight,
                     None if module.bias is None else module.bias.data,
+                    **(
+                        {"update_g_idx": not empty_weights}
+                        if "update_g_idx" in model._modules[name].set_weights_bias.__code__.co_varnames
+                        else {}
+                    ),
                 )
             else:
                 raise Exception("{} device Unsupported weight only quantization!".format(device))
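
The added `**(...)` splat is a runtime feature probe: `update_g_idx` is forwarded only when the installed ipex build's `set_weights_bias` actually declares that parameter, so the same call site works on ipex releases both before and after 2.7 without a version check. A minimal sketch of the pattern follows; `old_set_weights_bias` and `new_set_weights_bias` are hypothetical stand-ins for the two API generations, not functions from this commit:

    # Sketch only: conditionally pass a keyword argument that may or may not
    # exist in the callee's signature. The two callees below are hypothetical
    # stand-ins; the real method lives on the ipex linear module.

    def old_set_weights_bias(weight, bias):
        # pre-2.7 style: no update_g_idx parameter
        print("old API:", weight, bias)

    def new_set_weights_bias(weight, bias, update_g_idx=False):
        # 2.7+ style: accepts update_g_idx
        print("new API:", weight, bias, "update_g_idx =", update_g_idx)

    def call_set_weights_bias(fn, weight, bias, empty_weights=False):
        # __code__.co_varnames lists the function's parameter and local
        # variable names, so membership tells us whether update_g_idx
        # can be forwarded to this build of the API.
        kwargs = (
            {"update_g_idx": not empty_weights}
            if "update_g_idx" in fn.__code__.co_varnames
            else {}
        )
        fn(weight, bias, **kwargs)

    call_set_weights_bias(old_set_weights_bias, "w", "b")  # old API: w b
    call_set_weights_bias(new_set_weights_bias, "w", "b")  # new API: w b update_g_idx = True

One caveat: `co_varnames` also contains local variable names and will not report a keyword absorbed by `**kwargs`, so `inspect.signature(fn).parameters` is the stricter probe; the `co_varnames` test used in the commit is the lighter-weight option.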
