File tree Expand file tree Collapse file tree 1 file changed +14
-0
lines changed
vllm/model_executor/models Expand file tree Collapse file tree 1 file changed +14
-0
lines changed Original file line number Diff line number Diff line change @@ -205,6 +205,19 @@ def verify_and_update_config(vllm_config: "VllmConfig") -> None:
205
205
}
206
206
207
207
208
class GraniteMoeHybridModelConfig(VerifyAndUpdateConfig):
    """Config hook that aligns the CUDA graph capture length with the model.

    Sets ``max_seq_len_to_capture`` on the model config to ``max_model_len``
    so that, as the emitted log message states, CUDA graph capture covers
    sequences of length up to ``max_model_len``.
    """

    @staticmethod
    def verify_and_update_config(vllm_config: "VllmConfig") -> None:
        """Overwrite ``max_seq_len_to_capture`` with ``max_model_len``.

        Args:
            vllm_config: Configuration object whose ``model_config``
                attribute is updated in place.
        """
        config = vllm_config.model_config
        # Unconditional assignment: any previously configured capture length
        # is replaced by the model's maximum length.
        config.max_seq_len_to_capture = config.max_model_len
        logger.info(
            "Setting max_seq_len_to_capture to %d "
            "to ensure that CUDA graph capture "
            "covers sequences of length up to max_model_len.",
            config.max_model_len)
219
+
220
+
208
221
class HybridAttentionMambaModelConfig (VerifyAndUpdateConfig ):
209
222
210
223
@classmethod
@@ -297,4 +310,5 @@ def verify_and_update_config(cls, vllm_config: "VllmConfig") -> None:
297
310
"Qwen3ForSequenceClassification" : Qwen3ForSequenceClassificationConfig ,
298
311
"XLMRobertaModel" : JinaRobertaModelConfig ,
299
312
"JinaVLForRanking" : JinaVLForSequenceClassificationConfig ,
313
+ "GraniteMoeHybridForCausalLM" : GraniteMoeHybridModelConfig ,
300
314
}
You can’t perform that action at this time.
0 commit comments