From 62562ad82d3707fdc452b8febf2d85f3a6df34b4 Mon Sep 17 00:00:00 2001
From: Chengji Yao
Date: Thu, 24 Jul 2025 18:34:05 +0000
Subject: [PATCH] [TPU][Bugfix] fix OOM issue in CI test

Signed-off-by: Chengji Yao
---
 tests/v1/tpu/test_basic.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/v1/tpu/test_basic.py b/tests/v1/tpu/test_basic.py
index b9ee9d66a38f..d2baba8818fb 100644
--- a/tests/v1/tpu/test_basic.py
+++ b/tests/v1/tpu/test_basic.py
@@ -58,7 +58,7 @@ def test_basic(
                 # actually test chunked prompt
                 max_num_batched_tokens=1024,
                 max_model_len=8192,
-                gpu_memory_utilization=0.7,
+                gpu_memory_utilization=0.95,
                 max_num_seqs=max_num_seqs,
                 tensor_parallel_size=tensor_parallel_size) as vllm_model:
             vllm_outputs = vllm_model.generate_greedy(example_prompts,