[CUTLASS][FP8] Skip scaled_mm rowwise test on sm89 (#133612)

Rowwise implementation currently uses sm90-specific features incl. TMA CC @drisspg Pull Request resolved: https://github.com/pytorch/pytorch/pull/133612 Approved by: https://github.com/Skylion007
2025-10-20 21:14:14 +08:00 · 2024-08-15 23:43:28 +00:00
parent 413416cf33
commit 7ad3108ef2
1 changed files with 2 additions and 0 deletions
--- a/test/test_matmul_cuda.py
+++ b/test/test_matmul_cuda.py
@ -16,6 +16,7 @@ from torch.quantization._quantized_conversions import (
 from torch.testing import make_tensor
 from torch.testing._internal.common_cuda import (
    SM53OrLater,
+    SM90OrLater,
    _get_torch_cuda_version,
    PLATFORM_SUPPORTS_FP8
 )
@ -664,6 +665,7 @@ class TestFP8MatmulCuda(TestCase):
            )

    @unittest.skipIf(not PLATFORM_SUPPORTS_FP8 or IS_WINDOWS, f8_msg)
+    @unittest.skipIf(not SM90OrLater, "rowwise implementation is currently sm90 specific")
    @skipIfRocm()
    @parametrize("base_dtype", [torch.bfloat16])
    def test_scaled_mm_vs_emulated_row_wise(self, base_dtype):