Simple code refactoring

christian-pinto · christian-pinto · commit d32de8aaeaec · 2025-06-27T08:48:10.000Z
- Remove unused functions
- Merge functions that are not called anywhere else into their sole caller

Signed-off-by: Christian Pinto <christian.pinto@ibm.com>
diff --git a/vllm/v1/worker/gpu_model_runner.py b/vllm/v1/worker/gpu_model_runner.py
@@ -554,11 +554,16 @@ def _update_states(self, scheduler_output: "SchedulerOutput") -> None:
         if batch_changed or batch_reordered:
             self.input_batch.refresh_sampling_metadata()
 
-    def _add_multimodal_inputs_to_model_args(
+    def _maybe_add_multimodal_kwargs(
             self,
             model_kwargs: dict[str, Any],
-            scheduler_output: "SchedulerOutput",
-            num_reqs: int = -1):
+            scheduler_output: "SchedulerOutput" = None,
+            num_reqs: int = -1,
+    ):
+
+        if not self.model_supports_multimodal_raw_input:
+            return
+
         # Multi-modal data.
         if scheduler_output:
             multi_modal_kwargs_list = []
@@ -581,28 +586,7 @@ def _add_multimodal_inputs_to_model_args(
 
         model_kwargs.update(multi_modal_kwargs)
 
-    def _maybe_add_multimodal_kwargs(
-            self,
-            model_kwargs: dict[str, Any],
-            scheduler_output: "SchedulerOutput" = None,
-            num_reqs: int = -1):
-
-        if self.model_supports_multimodal_raw_input:
-            self._add_multimodal_inputs_to_model_args(model_kwargs,
-                                                      scheduler_output,
-                                                      num_reqs)
-
-    def _maybe_compute_attn_prefix(
-        self,
-        scheduler_output: "SchedulerOutput",
-    ) -> list[int]:
-        return [0] * len(self.kv_cache_config.kv_cache_groups)
-
-    def _maybe_prepare_additional_inputs(self,
-                                         scheduler_output: "SchedulerOutput",
-                                         token_indices: torch.Tensor):
-        pass
-
+ 
     def _get_cumsum_and_arange(
         self,
         num_tokens: np.ndarray,