[Bugfix][CPU] Fix InputBatch for pooling models in the CPU v1 (#20014)

Signed-off-by: jiang1.li <jiang1.li@intel.com>
This commit is contained in:
Li, Jiang
2025-06-24 21:20:04 +08:00
committed by GitHub
parent 9a3b88328f
commit 53da4cd397
2 changed files with 5 additions and 1 deletion

View File

@@ -101,4 +101,4 @@ def test_prm_models(
hf_output = torch.tensor(hf_output)
vllm_output = torch.tensor(vllm_output)
-assert torch.allclose(hf_output, vllm_output, 1e-2)
+assert torch.allclose(hf_output, vllm_output, 1.5e-2)