Commit 5d7667a

fix a bug after transformer upgrade
Signed-off-by: Xin He <xinhe3@habana.ai>
1 parent 2b220bb commit 5d7667a

File tree

1 file changed (+2, -1 lines)

  • neural_compressor/torch/algorithms/weight_only


neural_compressor/torch/algorithms/weight_only/gptq.py (+2, -1)

@@ -391,7 +391,8 @@ def forward(layer, *args, **kwargs):
         for arg in kwargs:
             # TODO: investigate include parameters
             # each outputs can be different shape, hence also use list to store
-            if isinstance(kwargs[arg], torch.Tensor) or arg == "alibi":
+            # position_embeddings is a list of two tensors in llama, handle it specially.
+            if isinstance(kwargs[arg], torch.Tensor) or arg in ["alibi", "position_embeddings"]:
                 if self.cache_key_arguments.get(arg, None) is None:
                     self.cache_key_arguments[arg] = []
                 self.cache_key_arguments[arg].append(kwargs[arg])
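To illustrate the fix: the patched hook caches forward keyword arguments during GPTQ calibration, but the `isinstance(..., torch.Tensor)` check misses kwargs whose values are containers of tensors. After the transformers upgrade, llama models pass `position_embeddings` as a pair of tensors (cos, sin), so it must be matched by name, like `alibi`. The sketch below is a hypothetical standalone version of this logic (names such as `cache_kwargs` and the module-level `cache_key_arguments` dict are illustrative; in the real code this lives inside a hooked `forward` method on `self`):

```python
import torch

# Illustrative stand-in for self.cache_key_arguments in the real hook.
cache_key_arguments = {}

def cache_kwargs(**kwargs):
    """Cache tensor-valued kwargs for later replay during calibration."""
    for arg in kwargs:
        # position_embeddings is a list/tuple of two tensors in llama, so the
        # isinstance check alone would skip it; match it (and alibi) by name.
        if isinstance(kwargs[arg], torch.Tensor) or arg in ["alibi", "position_embeddings"]:
            if cache_key_arguments.get(arg, None) is None:
                cache_key_arguments[arg] = []
            cache_key_arguments[arg].append(kwargs[arg])

# Example call shaped like a llama decoder-layer invocation (shapes are made up).
cos = torch.randn(1, 4, 8)
sin = torch.randn(1, 4, 8)
cache_kwargs(
    hidden_states=torch.randn(1, 4, 8),   # plain tensor: cached via isinstance
    position_embeddings=(cos, sin),        # tuple of tensors: cached by name
    use_cache=True,                        # non-tensor, not special-cased: skipped
)
```

Each cached kwarg accumulates one entry per forward call, since outputs can differ in shape across calls and are therefore stored in a list.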
