We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 3f30ef0 commit 590faf6Copy full SHA for 590faf6
recipe/deepeyes/deepeyes.py
@@ -78,8 +78,9 @@ def __getitem__(self, item):
78
multi_modal_data = {}
79
80
images = None
81
- if self.image_key in row_dict and row_dict.get(self.image_key, None) is not None:
82
- images = [Image.open(io.BytesIO(image["bytes"])) for image in row_dict.pop(self.image_key)]
+ row_dict_images = row_dict.pop(self.image_key, None)
+ if row_dict_images:
83
+ images = [Image.open(io.BytesIO(image["bytes"])) for image in row_dict_images]
84
85
# The image key is "image" rather than "images" in vllm, so we need to use "image" here.
86
# link: https://github.com/vllm-project/vllm/blob/3c545c0c3b98ee642373a308197d750d0e449403/vllm/multimodal/parse.py#L205 # noqa: E501
0 commit comments