vllm-project
diff --git a/‎.github/workflows/vllm_ascend_test.yaml
Lines changed: 2 additions & 1 deletion b/‎.github/workflows/vllm_ascend_test.yaml
Lines changed: 2 additions & 1 deletion
diff --git a/‎tests/conftest.py
Lines changed: 14 additions & 1 deletion b/‎tests/conftest.py
Lines changed: 14 additions & 1 deletion
@@ -148,7 +148,8 @@ jobs:
       - name: Run vllm-project/vllm-ascend key feature test
         if: steps.filter.outputs.speculative_tests_changed
         run: |
-          pytest -sv tests/spec_decode
+          pytest -sv tests/spec_decode/e2e/test_mtp_correctness.py
+          pytest -sv tests/spec_decode --ignore=tests/spec_decode/e2e/test_mtp_correctness.py 
 
       - name: Run vllm-project/vllm test
         run: |
 
@@ -17,14 +17,18 @@
 # limitations under the License.
 #
 
+import contextlib
+import gc
 from typing import List, Optional, Tuple, TypeVar, Union
 
 import numpy as np
 import pytest
+import torch
 from PIL import Image
 from vllm import LLM, SamplingParams
 from vllm.config import TaskOption
-from vllm.distributed import cleanup_dist_env_and_memory
+from vllm.distributed import (destroy_distributed_environment,
+                              destroy_model_parallel)
 from vllm.inputs import ExplicitEncoderDecoderPrompt, TextPrompt, TokensPrompt
 from vllm.logger import init_logger
 from vllm.outputs import RequestOutput
@@ -44,6 +48,15 @@
 PromptVideoInput = _PromptMultiModalInput[np.ndarray]
 
 
+def cleanup_dist_env_and_memory():  # Local replacement for the helper this patch stops importing from vllm.distributed.
+    destroy_model_parallel()  # imported from vllm.distributed; runs first, before the wider distributed teardown
+    destroy_distributed_environment()  # imported from vllm.distributed
+    with contextlib.suppress(AssertionError):  # best-effort: an AssertionError from the call below is ignored
+        torch.distributed.destroy_process_group()  # NOTE(review): presumably asserts when no process group exists - confirm
+    gc.collect()  # NOTE(review): presumably run so unreachable objects are collected before the cache is emptied - confirm
+    torch.npu.empty_cache()  # NOTE(review): torch.npu is presumably registered by torch_npu, imported elsewhere - confirm
+
+
 class VllmRunner:
 
     def __init__(