diff --git a/vllm/multimodal/image.py b/vllm/multimodal/image.py index d3a230e40477e..7ca64152e481a 100644 --- a/vllm/multimodal/image.py +++ b/vllm/multimodal/image.py @@ -56,7 +56,12 @@ def _default_input_mapper( .preprocess(data, return_tensors="pt") \ .data except Exception: - logger.error("Failed to process image (%s)", data) + logger.error( + "Failed to process image (%s) with the default mapper. " + "This is most likely an edge-case with this model's image " + "processor in transformers (type: %s), and not vLLM.", + data, + type(image_processor).__name__) raise return MultiModalInputs(batch_data)