From 0d9d612aa7b7ebfe3695591933a94cb801d6ac69 Mon Sep 17 00:00:00 2001 From: DarkLight1337 Date: Thu, 26 Sep 2024 23:09:09 +0000 Subject: [PATCH 01/31] Remove unnecessary warning for missing `dummy_encoder_data_factory` --- vllm/inputs/registry.py | 12 ++---------- 1 file changed, 2 insertions(+), 10 deletions(-) diff --git a/vllm/inputs/registry.py b/vllm/inputs/registry.py index 159d958ebf67..eed86ea02713 100644 --- a/vllm/inputs/registry.py +++ b/vllm/inputs/registry.py @@ -185,16 +185,8 @@ def wrapper(model_cls: N) -> N: return wrapper def _get_dummy_encoder_data_factory(self, model_cls: Type[nn.Module]): - if model_cls in self._dummy_encoder_factories_by_model_type: - dummy_factory = self._dummy_encoder_factories_by_model_type[ - model_cls] - else: - logger.warning( - "No dummy encoder data factory registered to %s. " - "Using the dummy data factory for the model instead.", - model_cls) - dummy_factory = self._get_dummy_data_factory(model_cls) - return dummy_factory + return self._dummy_encoder_factories_by_model_type \ + .get(model_cls, self._default_dummy_data_factory) def dummy_data_for_profiling( self, From a93a4e111e81f3b2f3fa2bb2c15923ed901f79d5 Mon Sep 17 00:00:00 2001 From: DarkLight1337 Date: Thu, 26 Sep 2024 23:09:16 +0000 Subject: [PATCH 02/31] Actually test mllama --- .buildkite/test-pipeline.yaml | 1 + 1 file changed, 1 insertion(+) diff --git a/.buildkite/test-pipeline.yaml b/.buildkite/test-pipeline.yaml index b4226a3ca574..48cfebb264b3 100644 --- a/.buildkite/test-pipeline.yaml +++ b/.buildkite/test-pipeline.yaml @@ -330,6 +330,7 @@ steps: commands: - pytest -v -s models/embedding/language - pytest -v -s models/encoder_decoder/language + - pytest -v -s models/encoder_decoder/vision_language ##### 1 GPU test ##### ##### multi gpus test ##### From 3241f706e76c23970ce4860dc6e286fad5d94246 Mon Sep 17 00:00:00 2001 From: DarkLight1337 Date: Fri, 27 Sep 2024 00:50:52 +0000 Subject: [PATCH 03/31] Use smaller model for llava_onevision and fix chat template --- .../vision_language/test_llava_onevision.py | 22 ++++++------------- 1 file changed, 7 insertions(+), 15 deletions(-) diff --git a/tests/models/decoder_only/vision_language/test_llava_onevision.py b/tests/models/decoder_only/vision_language/test_llava_onevision.py index 978631feacb8..6852244574a7 100644 --- a/tests/models/decoder_only/vision_language/test_llava_onevision.py +++ b/tests/models/decoder_only/vision_language/test_llava_onevision.py @@ -16,11 +16,10 @@ # Video test HF_VIDEO_PROMPTS = VIDEO_ASSETS.prompts({ "sample_demo_1": - "<|im_start|>user