Skip to content

Commit 370cc68

Browse files
authored
fix bug where FusedMoE object has no attribute w13_weight (#94)
Signed-off-by: yuwenzho <yuwen.zhou@intel.com>
1 parent 9ceb958 commit 370cc68

File tree

1 file changed

+3
-0
lines changed

1 file changed

+3
-0
lines changed

neural_compressor/torch/algorithms/fp8_quant/_quant_common/helper_modules.py

+3
Original file line numberDiff line numberDiff line change
@@ -14,6 +14,7 @@
1414

1515
import torch
1616
import torch.nn as nn
17+
import types
1718

1819
from .quant_config import QuantMode, get_hqt_config, ScaleFormat
1920
from .._core.quant_dequant import QuantDequant as qdq
@@ -294,6 +295,8 @@ def __init__(self, mod, mod_extra_config, *args, **kwargs):
294295
if self.quantization_mode in [QuantMode.QUANTIZE, QuantMode.LOAD]:
295296
delattr(mod, "w13_weight")
296297
delattr(mod, "w2_weight")
298+
setattr(mod, "w13_weight", None)
299+
setattr(mod, "w2_weight", None)
297300
setattr(self, "w13_weight", None)
298301
setattr(self, "w2_weight", None)
299302
self.forward = self.forward_orig

0 commit comments

Comments
 (0)