From 80b94da0610501bbe7142faeff0e2883703e206b Mon Sep 17 00:00:00 2001 From: NickLucche Date: Fri, 31 Jan 2025 19:11:52 +0000 Subject: [PATCH 1/2] f16 test Signed-off-by: NickLucche --- tests/spec_decode/e2e/test_integration_dist_tp2.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/spec_decode/e2e/test_integration_dist_tp2.py b/tests/spec_decode/e2e/test_integration_dist_tp2.py index 7001ee4c007f..7dba5cf10bfc 100644 --- a/tests/spec_decode/e2e/test_integration_dist_tp2.py +++ b/tests/spec_decode/e2e/test_integration_dist_tp2.py @@ -78,7 +78,7 @@ def test_target_model_tp_gt_1(common_llm_kwargs, per_test_common_llm_kwargs, # precision "--dtype", - "bfloat16", + "float16", ]]) @pytest.mark.parametrize("per_test_common_llm_kwargs", [[]]) @pytest.mark.parametrize("baseline_llm_kwargs", [[]]) From 9e966e7a01e28e595488139305ba28d58a7e4c03 Mon Sep 17 00:00:00 2001 From: NickLucche Date: Fri, 31 Jan 2025 19:22:14 +0000 Subject: [PATCH 2/2] re-add flaky test to suite Signed-off-by: NickLucche --- .buildkite/test-pipeline.yaml | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/.buildkite/test-pipeline.yaml b/.buildkite/test-pipeline.yaml index d5d02fdeb7f4..a6fa4c77c813 100644 --- a/.buildkite/test-pipeline.yaml +++ b/.buildkite/test-pipeline.yaml @@ -488,9 +488,7 @@ steps: - pytest models/encoder_decoder/language/test_bart.py -v -s -m 'distributed(num_gpus=2)' - pytest models/encoder_decoder/vision_language/test_broadcast.py -v -s -m 'distributed(num_gpus=2)' - pytest models/decoder_only/vision_language/test_models.py -v -s -m 'distributed(num_gpus=2)' - # this test fails consistently. - # TODO: investigate and fix - # - pytest -v -s spec_decode/e2e/test_integration_dist_tp2.py + - pytest -v -s spec_decode/e2e/test_integration_dist_tp2.py - CUDA_VISIBLE_DEVICES=0,1 pytest -v -s test_sharded_state_loader.py - CUDA_VISIBLE_DEVICES=0,1 pytest -v -s kv_transfer/disagg_test.py