diff --git a/vllm/worker/cpu_model_runner.py b/vllm/worker/cpu_model_runner.py index a4411c5b78347..a3dc57574d1e0 100644 --- a/vllm/worker/cpu_model_runner.py +++ b/vllm/worker/cpu_model_runner.py @@ -358,6 +358,7 @@ def prepare_model_input( input_positions=input_positions, attn_metadata=attn_metadata, sampling_metadata=sampling_metadata, + multi_modal_kwargs=multi_modal_kwargs, ) @torch.inference_mode()