Skip to content

Commit f1984f4

Browse files
authored
Add llama test model to cover MQA (#585)
* Change llama test model to cover MQA
* Keep llama and llama2 in tests
* Fix code style
1 parent 5e319aa commit f1984f4

File tree

3 files changed

+9
-1
lines changed

3 files changed

+9
-1
lines changed

tests/generation/test_modeling.py

+2
Original file line numberDiff line numberDiff line change
@@ -31,6 +31,7 @@
3131
"gpt_neo": "hf-internal-testing/tiny-random-GPTNeoModel",
3232
"mistral": "echarlaix/tiny-random-mistral",
3333
"llama": "fxmarty/tiny-llama-fast-tokenizer",
34+
"llama2": "Jiqing/tiny_random_llama2",
3435
"gpt_bigcode": "hf-internal-testing/tiny-random-GPTBigCodeModel",
3536
}
3637

@@ -54,6 +55,7 @@ class ModelingIntegrationTest(unittest.TestCase):
5455
"gpt_neo",
5556
"mistral",
5657
"llama",
58+
"llama2",
5759
# "gpt_bigcode",
5860
)
5961

tests/ipex/test_inference.py

+2
Original file line numberDiff line numberDiff line change
@@ -42,6 +42,7 @@
4242
"gpt_neox": "hf-internal-testing/tiny-random-GPTNeoXForCausalLM",
4343
"gpt_bigcode": "hf-internal-testing/tiny-random-GPTBigCodeModel",
4444
"llama": "fxmarty/tiny-llama-fast-tokenizer",
45+
"llama2": "Jiqing/tiny_random_llama2",
4546
"opt": "hf-internal-testing/tiny-random-OPTModel",
4647
"mpt": "hf-internal-testing/tiny-random-MptForCausalLM",
4748
}
@@ -66,6 +67,7 @@ class IPEXIntegrationTest(unittest.TestCase):
6667
"gpt_neo",
6768
# "gpt_bigcode",
6869
"llama",
70+
"llama2",
6971
"opt",
7072
"mpt",
7173
)

tests/ipex/test_modeling.py

+5-1
Original file line numberDiff line numberDiff line change
@@ -67,6 +67,7 @@
6767
"gptj": "hf-internal-testing/tiny-random-GPTJModel",
6868
"levit": "hf-internal-testing/tiny-random-LevitModel",
6969
"llama": "fxmarty/tiny-llama-fast-tokenizer",
70+
"llama2": "Jiqing/tiny_random_llama2",
7071
"marian": "sshleifer/tiny-marian-en-de",
7172
"mbart": "hf-internal-testing/tiny-random-mbart",
7273
"mistral": "echarlaix/tiny-random-mistral",
@@ -209,6 +210,7 @@ class IPEXModelForCausalLMTest(unittest.TestCase):
209210
"gpt_neo",
210211
"gpt_neox",
211212
"llama",
213+
"llama2",
212214
"mistral",
213215
# "phi",
214216
"mpt",
@@ -226,7 +228,9 @@ def test_compare_to_transformers(self, model_arch):
226228
self.assertTrue(ipex_model.use_cache)
227229
tokenizer = AutoTokenizer.from_pretrained(model_id)
228230
tokens = tokenizer(
229-
"This is a sample", return_tensors="pt", return_token_type_ids=False if model_arch == "llama" else None
231+
"This is a sample",
232+
return_tensors="pt",
233+
return_token_type_ids=False if model_arch in ("llama", "llama2") else None,
230234
)
231235
position_ids = None
232236
if model_arch.replace("_", "-") in MODEL_TYPES_REQUIRING_POSITION_IDS:

0 commit comments

Comments (0)