Fix gemv_4bit test on CPUs with AVX512-BF16 (#1956)

matthewdouglas · web-flow · commit 857b83d9bbd0 · 2026-05-26T16:07:03.000-04:00
diff --git a/pyproject.toml b/pyproject.toml
@@ -101,6 +101,7 @@ markers = [
     "deprecated: mark test as covering a deprecated feature",
     "slow: mark test as slow",
 ]
+testpaths = ["tests"]
 
 [tool.ruff]
 src = [
diff --git a/tests/test_functional.py b/tests/test_functional.py
@@ -807,14 +807,20 @@ def test_gemv_4bit(self, device, dim, dtype, storage_type, double_quant, kind):
                 compress_statistics=double_quant,
                 quant_storage=quant_storage,
             )
+
+            # dequant+F.linear reference path.
+            C1 = torch.nn.functional.linear(A, F.dequantize_4bit(qB, state).to(dtype))
+
+            # original matmul reference path.
             C3 = torch.matmul(A, B.t())
+
             # CPU requires convert weight packed for gemv
             if device == "cpu" and F.has_avx512bf16():
                 qB, state = F._convert_weight_packed_for_cpu(qB, state)
                 qB = qB.t()
+
+            # GEMV test
             C2 = F.gemv_4bit(A, qB.t(), state=state)
-            # dequant+F.linear reference path
-            C1 = torch.nn.functional.linear(A, F.dequantize_4bit(qB, state).to(dtype))
 
             err1 = (C1 - C2).abs().float()
             err2 = (C3 - C2).abs().float()

Original file line number	Diff line number	Diff line change
`@@ -101,6 +101,7 @@ markers = [`
`101`	`101`	`"deprecated: mark test as covering a deprecated feature",`
`102`	`102`	`"slow: mark test as slow",`
`103`	`103`	`]`
	`104`	`+testpaths = ["tests"]`
`104`	`105`
`105`	`106`	`[tool.ruff]`
`106`	`107`	`src = [`