diff --git a/test/inductor/test_cuda_select_algorithm.py b/test/inductor/test_cuda_select_algorithm.py index f580aaa5a1d..7fd9fadc1cc 100644 --- a/test/inductor/test_cuda_select_algorithm.py +++ b/test/inductor/test_cuda_select_algorithm.py @@ -138,6 +138,7 @@ class TestSelectAlgorithmCuda(BaseTestSelectAlgorithm): @parametrize("in_features", (128,)) @parametrize("out_features", (64,)) @unittest.skipIf(not TEST_CUDA, "CUDA not available") + @unittest.skipIf(TEST_WITH_SLOW_GRADCHECK, "Leaking memory") def test_int8_woq_mm_concat_cuda( self, dtype, batch_size, mid_dim, in_features, out_features ):