@@ -317,6 +317,13 @@ def _reorder_cache(self, *args, **kwargs):
317
317
def prepare_inputs_for_generation(self, *args, **kwargs):
    """Delegate generation input preparation to the wrapped model.

    This class is a thin wrapper around ``self.model``; all arguments are
    forwarded unchanged and the wrapped model's result is returned as-is.
    """
    delegate = self.model.prepare_inputs_for_generation
    return delegate(*args, **kwargs)
319
319
320
+ def _supports_num_logits_to_keep (self ) -> bool :
321
+ """
322
+ Return True if the current model supports the keyword argument `num_logits_to_keep` in forward()
323
+ to save memory. Checking it in this way allows to avoid using a new model attribute.
324
+ """
325
+ return "num_logits_to_keep" in set (inspect .signature (self .model .forward ).parameters .keys ())
326
+
320
327
def generate (self , * args , ** kwargs ):
321
328
if self ._add_patch and kwargs .get ("assistant_model" , None ):
322
329
raise ValueError (
@@ -427,6 +434,13 @@ def prepare_inputs_for_generation(self, *args, **kwargs):
427
434
def get_encoder(self, *args, **kwargs):
    """Return the encoder of the wrapped model.

    Pure pass-through: every positional and keyword argument is handed to
    ``self.model.get_encoder`` and its result is returned unchanged.
    """
    delegate = self.model.get_encoder
    return delegate(*args, **kwargs)
429
436
437
+ def _supports_num_logits_to_keep (self ) -> bool :
438
+ """
439
+ Return True if the current model supports the keyword argument `num_logits_to_keep` in forward()
440
+ to save memory. Checking it in this way allows to avoid using a new model attribute.
441
+ """
442
+ return "num_logits_to_keep" in set (inspect .signature (self .model .forward ).parameters .keys ())
443
+
430
444
def _init_warmup(self):
    """Run one tiny generation pass to warm the model up.

    Builds example inputs via ``prepare_jit_inputs`` (helper defined elsewhere
    in this file) and triggers a short ``generate`` call (4 new tokens).
    """
    warmup_inputs = prepare_jit_inputs(self.model, self.export_feature, False)
    self.generate(
        input_ids=warmup_inputs["input_ids"],
        attention_mask=warmup_inputs["attention_mask"],
        max_new_tokens=4,
    )
0 commit comments