From d681af3fed5f974387393a809d3445f2b324f8c1 Mon Sep 17 00:00:00 2001
From: Mitch Lewis
Date: Tue, 13 Jan 2026 18:52:27 -0700
Subject: [PATCH] Revert "[Bugfix][CI/Build] Fix failing pooling models test due to Triton kernel accuracy diff (#31776)"

This reverts commit ee2e69d6cda898736cc2987cb8cdfaa2601c1375.
---
 tests/models/language/pooling/test_token_classification.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/models/language/pooling/test_token_classification.py b/tests/models/language/pooling/test_token_classification.py
index b84f05ae3099..341df02e74ef 100644
--- a/tests/models/language/pooling/test_token_classification.py
+++ b/tests/models/language/pooling/test_token_classification.py
@@ -78,7 +78,7 @@ def test_modernbert_models(
     for hf_output, vllm_output in zip(hf_outputs, vllm_outputs):
         hf_output = hf_output.detach().clone().cpu().float()
         vllm_output = vllm_output.detach().clone().cpu().float()
-        torch.testing.assert_close(hf_output, vllm_output, atol=1.2e-2, rtol=1e-3)
+        assert torch.allclose(hf_output, vllm_output, atol=1e-2)
 
 
 @pytest.mark.parametrize("model", ["bd2lcco/Qwen3-0.6B-finetuned"])