Skip to content

Commit 0253381

Browse files
authored
fix config (#2858)
1 parent 2d1184a commit 0253381

File tree

1 file changed

+3
-2
lines changed

1 file changed

+3
-2
lines changed

fastdeploy/config.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -59,6 +59,7 @@ class MoEPhase(Enum):
5959
"tie_word_embeddings":False,
6060
"rms_norm_eps":1e-5,
6161
"moe_num_experts": None,
62+
"moe_layer_end_index":None,
6263
}
6364

6465

@@ -330,7 +331,7 @@ def init_with_cudagrpah_size(
330331
if len(dedup_sizes) < len(self.cudagraph_capture_sizes):
331332
logger.info(("cudagraph sizes specified by model runner"
332333
" %s is overridden by config %s"),
333-
cudagraph_capture_sizes, dedup_sizes)
334+
self.cudagraph_capture_sizes, dedup_sizes)
334335
self.cudagraph_capture_sizes = dedup_sizes
335336

336337
# Sort to make sure cudagraph capture sizes are in descending order
@@ -351,7 +352,7 @@ def init_with_cudagrpah_size(
351352
self.max_capture_size] = self.max_capture_size
352353

353354
def _set_cudagraph_sizes(
354-
self,
355+
self,
355356
max_num_seqs:int = 0
356357
):
357358
"""

0 commit comments

Comments
 (0)