@@ -561,11 +561,16 @@ def _update_states(self, scheduler_output: "SchedulerOutput") -> None:
561
561
# Refresh batch metadata with any pending updates.
562
562
self .input_batch .refresh_metadata ()
563
563
564
- def _add_multimodal_inputs_to_model_args (
564
+ def _maybe_add_multimodal_kwargs (
565
565
self ,
566
566
model_kwargs : dict [str , Any ],
567
- scheduler_output : "SchedulerOutput" ,
568
- num_reqs : int = - 1 ):
567
+ scheduler_output : "SchedulerOutput" = None ,
568
+ num_reqs : int = - 1 ,
569
+ ):
570
+
571
+ if not self .model_supports_multimodal_raw_input :
572
+ return
573
+
569
574
# Multi-modal data.
570
575
if scheduler_output :
571
576
multi_modal_kwargs_list = []
@@ -588,28 +593,7 @@ def _add_multimodal_inputs_to_model_args(
588
593
589
594
model_kwargs .update (multi_modal_kwargs )
590
595
591
- def _maybe_add_multimodal_kwargs (
592
- self ,
593
- model_kwargs : dict [str , Any ],
594
- scheduler_output : "SchedulerOutput" = None ,
595
- num_reqs : int = - 1 ):
596
-
597
- if self .model_supports_multimodal_raw_input :
598
- self ._add_multimodal_inputs_to_model_args (model_kwargs ,
599
- scheduler_output ,
600
- num_reqs )
601
-
602
- def _maybe_compute_attn_prefix (
603
- self ,
604
- scheduler_output : "SchedulerOutput" ,
605
- ) -> list [int ]:
606
- return [0 ] * len (self .kv_cache_config .kv_cache_groups )
607
-
608
- def _maybe_prepare_additional_inputs (self ,
609
- scheduler_output : "SchedulerOutput" ,
610
- token_indices : torch .Tensor ):
611
- pass
612
-
596
+
613
597
def _get_cumsum_and_arange (
614
598
self ,
615
599
num_tokens : np .ndarray ,
0 commit comments