File tree 1 file changed +8
-1
lines changed
python/ray/llm/tests/batch/gpu/stages
1 file changed +8
-1
lines changed Original file line number Diff line number Diff line change @@ -171,6 +171,9 @@ async def test_vllm_wrapper_semaphore(model_llama_3_2_216M):
171
171
patch (
172
172
"ray.llm._internal.batch.stages.vllm_engine_stage.vLLMEngineWrapper.generate_async_v0"
173
173
) as mock_generate_async_v0 ,
174
+ patch (
175
+ "ray.llm._internal.batch.stages.vllm_engine_stage.vLLMEngineWrapper.generate_async_v1"
176
+ ) as mock_generate_async_v1 ,
174
177
):
175
178
mock_engine .from_engine_args .return_value = AsyncMock ()
176
179
num_running_requests = 0
@@ -207,6 +210,7 @@ async def mock_generate(request):
207
210
)
208
211
209
212
mock_generate_async_v0 .side_effect = mock_generate
213
+ mock_generate_async_v1 .side_effect = mock_generate
210
214
211
215
# Create wrapper with max 2 pending requests
212
216
wrapper = vLLMEngineWrapper (
@@ -227,7 +231,10 @@ async def mock_generate(request):
227
231
await asyncio .gather (* tasks )
228
232
229
233
# Verify all requests were processed
230
- assert mock_generate_async_v0 .call_count == 10
234
+ assert (
235
+ mock_generate_async_v0 .call_count == 10
236
+ or mock_generate_async_v1 .call_count == 10
237
+ )
231
238
232
239
233
240
@pytest .mark .asyncio
You can’t perform that action at this time.
0 commit comments