@@ -558,11 +558,16 @@ def _update_states(self, scheduler_output: "SchedulerOutput") -> None:
558
558
# Refresh batch metadata with any pending updates.
559
559
self .input_batch .refresh_metadata ()
560
560
561
- def _add_multimodal_inputs_to_model_args (
561
+ def _maybe_add_multimodal_kwargs (
562
562
self ,
563
563
model_kwargs : dict [str , Any ],
564
- scheduler_output : "SchedulerOutput" ,
565
- num_reqs : int = - 1 ):
564
+ scheduler_output : "SchedulerOutput" = None ,
565
+ num_reqs : int = - 1 ,
566
+ ):
567
+
568
+ if not self .model_supports_multimodal_raw_input :
569
+ return
570
+
566
571
# Multi-modal data.
567
572
if scheduler_output :
568
573
multi_modal_kwargs_list = []
@@ -585,28 +590,7 @@ def _add_multimodal_inputs_to_model_args(
585
590
586
591
model_kwargs .update (multi_modal_kwargs )
587
592
588
- def _maybe_add_multimodal_kwargs (
589
- self ,
590
- model_kwargs : dict [str , Any ],
591
- scheduler_output : "SchedulerOutput" = None ,
592
- num_reqs : int = - 1 ):
593
-
594
- if self .model_supports_multimodal_raw_input :
595
- self ._add_multimodal_inputs_to_model_args (model_kwargs ,
596
- scheduler_output ,
597
- num_reqs )
598
-
599
- def _maybe_compute_attn_prefix (
600
- self ,
601
- scheduler_output : "SchedulerOutput" ,
602
- ) -> list [int ]:
603
- return [0 ] * len (self .kv_cache_config .kv_cache_groups )
604
-
605
- def _maybe_prepare_additional_inputs (self ,
606
- scheduler_output : "SchedulerOutput" ,
607
- token_indices : torch .Tensor ):
608
- pass
609
-
593
+
610
594
def _get_cumsum_and_arange (
611
595
self ,
612
596
num_tokens : np .ndarray ,
0 commit comments