Skip to content

Commit 8b31e79

Browse files
committed
fix bugs in forward_end
1 parent edb38e4 commit 8b31e79

File tree

1 file changed

+10
-7
lines changed

1 file changed

+10
-7
lines changed

vllm_ascend/eplb/eplb_updator.py

Lines changed: 10 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -130,14 +130,17 @@ def forward_before(self):
130 130
self.reqs = []
131 131
self.eplb_loader.asyn_expert_weight_transfer(self.reqs)
132 132

133-
def forward_end(self, dummy_run=False):
133+
def forward_end(self,dummy_run=False):
134 134
self.adaptor.get_rank_expert_workload(self.num_moe_layers,dummy_run)
135-
if not self.update_in_flight and self.get_update_iteration():
136-
moe_load = self.compute_and_set_moe_load(dummy_run)
137-
self.wakeup_eplb_worker()
138-
self.update_in_flight = True
139-
self.wait_worker_iterations = 0
140-
self.weight_loading = False
135+
if not self.update_in_flight:
136+
load_gather_iteration, update_iteration = self.get_update_iteration()
137+
if load_gather_iteration:
138+
moe_load = self.compute_and_set_moe_load(dummy_run)
139+
if update_iteration:
140+
self.wakeup_eplb_worker()
141+
self.update_in_flight = True
142+
self.wait_worker_iterations = 0
143+
self.weight_loading = False
141 144

142 145
if self.update_in_flight:
143 146
self.wait_worker_iterations = self.wait_worker_iterations + 1

0 commit comments

Comments
 (0)