From b9858f755598ca84e8f3981be71707aad7e1cead Mon Sep 17 00:00:00 2001 From: Mark McLoughlin Date: Mon, 10 Mar 2025 17:50:19 -0400 Subject: [PATCH] [WIP][V1][Structured Output] Enable structured output test Enable `tests/v1/entrypoints/llm/test_struct_output_generate.py` in CI. WIP while we debug why this sometimes fails with: ``` RuntimeError: Cannot re-initialize CUDA in forked subprocess. To use CUDA with multiprocessing, you must use the 'spawn' start method ``` The failure can be reproduced in some environments with: ``` VLLM_USE_V1=1 pytest -s -v 'tests/v1/entrypoints/llm/test_struct_output_generate.py::test_guided_grammar_ebnf[xgrammar]' 'tests/v1/entrypoints/llm/test_struct_output_generate.py::test_guided_grammar_lark[xgrammar]' ``` Signed-off-by: Mark McLoughlin --- .buildkite/test-pipeline.yaml | 1 + 1 file changed, 1 insertion(+) diff --git a/.buildkite/test-pipeline.yaml b/.buildkite/test-pipeline.yaml index 2af76cb24dd1..56f641300113 100644 --- a/.buildkite/test-pipeline.yaml +++ b/.buildkite/test-pipeline.yaml @@ -202,6 +202,7 @@ steps: # split the test to avoid interference - VLLM_USE_V1=1 pytest -v -s v1/core - VLLM_USE_V1=1 pytest -v -s v1/engine + - VLLM_USE_V1=1 pytest -v -s v1/entrypoints/llm - VLLM_USE_V1=1 pytest -v -s v1/sample - VLLM_USE_V1=1 pytest -v -s v1/worker - VLLM_USE_V1=1 pytest -v -s v1/structured_output