Skip to content

Commit 8f2e33e

Browse files
committed
add ut for cv parallel
Signed-off-by: David9857 <985700846@qq.com>
1 parent a7195df commit 8f2e33e

File tree

1 file changed

+26
-0
lines changed

1 file changed

+26
-0
lines changed

tests/multicard/test_offline_inference_distributed.py

Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -64,3 +64,29 @@ def test_models_distributed_DeepSeek():
6464
distributed_executor_backend="mp",
6565
) as vllm_model:
6666
vllm_model.generate_greedy(example_prompts, max_tokens)
67+
68+
69+
@pytest.mark.skipif(os.getenv("VLLM_USE_V1") == "1",
                    reason="deepseek v2 lite is not supported on v1")
def test_models_distributed_DeepSeek_with_cv_parallel():
    """Smoke-test greedy generation on DeepSeek-V2-Lite with cv-parallel on.

    Runs a 4-way tensor-parallel model via the multiprocessing executor with
    ``enable_graph_mode`` and ``enable_cv_parallel`` set in the additional
    config, and checks that greedy decoding completes without error.
    """
    example_prompts = [
        "vLLM is a high-throughput and memory-efficient inference and serving engine for LLMs.",
        "Briefly describe the major milestones in the development of artificial intelligence from 1950 to 2020.",
        "Compare and contrast artificial intelligence with human intelligence in terms of processing information.",
    ]
    max_tokens = 5
    # Graph mode plus communication/computation (cv) parallelism — the
    # combination this test exists to exercise.
    additional_config = {
        'enable_graph_mode': True,
        'enable_cv_parallel': True,
    }
    with VllmRunner(
            "deepseek-ai/DeepSeek-V2-Lite",
            dtype="half",
            tensor_parallel_size=4,
            distributed_executor_backend="mp",
            additional_config=additional_config,
    ) as vllm_model:
        vllm_model.generate_greedy(example_prompts, max_tokens)

0 commit comments

Comments
 (0)