Skip to content

Commit b408e85

Browse files
authored
Update model_runner_v1.py
1 parent a4049ad commit b408e85

File tree

1 file changed

+3
-4
lines changed

1 file changed

+3
-4
lines changed

vllm_ascend/worker/model_runner_v1.py

Lines changed: 3 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -1167,16 +1167,15 @@ def load_model(self) -> None:
11671167

11681168
with DeviceMemoryProfiler() as m: # noqa: SIM117
11691169
self.model = get_model(vllm_config=self.vllm_config)
1170+
if hasattr(self, "drafter"):
1171+
logger.info("Loading drafter model...")
1172+
self.drafter.load_model(self.model)
11701173
if self.lora_config:
11711174
self.model = self.load_lora_model(self.model,
11721175
self.model_config,
11731176
self.scheduler_config,
11741177
self.lora_config,
11751178
self.device)
1176-
1177-
if hasattr(self, "drafter"):
1178-
logger.info("Loading drafter model...")
1179-
self.drafter.load_model(self.model)
11801179
logger.info("Loading model weights took %.4f GB",
11811180
m.consumed_memory / float(2**30))
11821181

0 commit comments

Comments
 (0)