diff --git a/vllm/worker/cpu_model_runner.py b/vllm/worker/cpu_model_runner.py
index e3464c0d3900..148332f3402f 100644
--- a/vllm/worker/cpu_model_runner.py
+++ b/vllm/worker/cpu_model_runner.py
@@ -355,6 +355,7 @@ def prepare_model_input(
             input_positions=input_positions,
             attn_metadata=attn_metadata,
             sampling_metadata=sampling_metadata,
+            multi_modal_kwargs=multi_modal_kwargs,
         )
 
     @torch.inference_mode()