diff --git a/vllm/worker/model_runner.py b/vllm/worker/model_runner.py index a1184ff2093b5..aed92bae20b6c 100644 --- a/vllm/worker/model_runner.py +++ b/vllm/worker/model_runner.py @@ -744,7 +744,7 @@ def _prepare_model_input_tensors( " Otherwise, the output might be wrong." " Set Flashinfer backend by " "export VLLM_ATTENTION_BACKEND=FLASHINFER.") - + if log_runner: print("Final tensors:") for name, tensor in [("input_tokens_tensor", input_tokens_tensor),