Skip to content

Commit 0a1ddd2

Browse files
committed
chore: refine the init options of datadist
Signed-off-by: Jade Zheng <zheng.shoujian@outlook.com>
1 parent d967a87 commit 0a1ddd2

File tree

1 file changed

+4
-7
lines changed

1 file changed

+4
-7
lines changed

vllm_ascend/distributed/llmdatadist_connector_v1.py

Lines changed: 4 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -290,18 +290,15 @@ def __init__(self, role: llm_datadist.LLMRole, local_rank: int,
290290
self.role, self.cluster_id)
291291

292292
def prepare_data_dist(self):
293+
# TODO: ge.flowGraphMemMaxSize is the maximum size of the mbuf for the llm datadist. We need to
294+
# find an appropriate value to minimize memory waste.
293295
options = {
294296
"llm.SyncKvCacheWaitTime": envs.LLMDATADIST_SYNC_CACHE_WAIT_TIME,
297+
"ge.flowGraphMemMaxSize": f"{(9*1024*1024*1024):d}",
298+
"ge.exec.deviceId": str(self.local_rank),
295299
}
296300
if self.role == llm_datadist.LLMRole.PROMPT:
297-
# TODO: This represents the maximum size of the mbuf for the llm
298-
# datadist. We need to find an appropriate value to minimize memory
299-
# waste.
300-
# options["ge.flowGraphMemMaxSize"] = "1024" # MB
301-
options["ge.exec.deviceId"] = str(self.local_rank)
302301
options["llm.listenIpInfo"] = f"{self.local_device_ip}:26000"
303-
else:
304-
options["ge.exec.deviceId"] = str(self.local_rank)
305302
self.datadist_engine.init(options)
306303
self.kv_transfer = self.datadist_engine.kv_cache_manager
307304

0 commit comments

Comments
 (0)