2 files changed: +9 −11 lines changed
vllm/model_executor/layers/fused_moe — 2 files changed: +9 −11 lines changed
Original file line number | Diff line number | Diff line change
5
5
import dataclasses
6
6
import importlib
7
7
import os
8
+ import socket
8
9
import traceback
10
+ from contextlib import closing
9
11
from typing import Callable , Optional
10
12
11
13
import torch
14
16
spawn ) # pyright: ignore[reportPrivateImportUsage]
15
17
from typing_extensions import Concatenate , ParamSpec
16
18
17
- from vllm .model_executor .layers .fused_moe .utils import find_free_port
18
-
19
19
has_deep_ep = importlib .util .find_spec ("deep_ep" ) is not None
20
20
if has_deep_ep :
21
21
from vllm .model_executor .layers .fused_moe .deepep_ht_prepare_finalize import ( # noqa: E501
@@ -82,6 +82,13 @@ def _worker_parallel_launch(
82
82
torch .distributed .destroy_process_group ()
83
83
84
84
85
+ def find_free_port ():
86
+ with closing (socket .socket (socket .AF_INET , socket .SOCK_STREAM )) as s :
87
+ s .bind (('' , 0 ))
88
+ s .setsockopt (socket .SOL_SOCKET , socket .SO_REUSEADDR , 1 )
89
+ return s .getsockname ()[1 ]
90
+
91
+
85
92
def parallel_launch (
86
93
world_size : int ,
87
94
worker : Callable [Concatenate [ProcessGroupInfo , P ], None ],
Original file line number Diff line number Diff line change 1
1
# SPDX-License-Identifier: Apache-2.0
2
2
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
3
- import socket
4
- from contextlib import closing
5
3
from math import prod
6
4
from typing import Optional
7
5
@@ -101,13 +99,6 @@ def _fp8_perm(m: torch.Tensor, idx: torch.Tensor) -> torch.Tensor:
101
99
return m [idx , ...]
102
100
103
101
104
- def find_free_port ():
105
- with closing (socket .socket (socket .AF_INET , socket .SOCK_STREAM )) as s :
106
- s .bind (('' , 0 ))
107
- s .setsockopt (socket .SOL_SOCKET , socket .SO_REUSEADDR , 1 )
108
- return s .getsockname ()[1 ]
109
-
110
-
111
102
# TODO(bnell): better name
112
103
def maybe_fix_scales (scales : Optional [torch .Tensor ],
113
104
num_experts : int ) -> Optional [torch .Tensor ]:
You can’t perform that action at this time.
0 commit comments