diff --git a/fbgemm_gpu/experimental/gen_ai/test/quantize/quantize_test.py b/fbgemm_gpu/experimental/gen_ai/test/quantize/quantize_test.py index d34a78d41..4511fc965 100644 --- a/fbgemm_gpu/experimental/gen_ai/test/quantize/quantize_test.py +++ b/fbgemm_gpu/experimental/gen_ai/test/quantize/quantize_test.py @@ -106,7 +106,6 @@ def test_f8f8bf16(self, kernel: str, use_fast_accum: bool) -> None: ((not torch.version.cuda) and (not torch.version.hip)), "Skip if no GPU is present.", ) - @settings(deadline=None) def test_f8f8bf16_rowwise_simple(self) -> None: M = 128 N = 128 diff --git a/fbgemm_gpu/fbgemm_gpu/sparse_ops.py b/fbgemm_gpu/fbgemm_gpu/sparse_ops.py index 2cbc1af1c..c43053a03 100644 --- a/fbgemm_gpu/fbgemm_gpu/sparse_ops.py +++ b/fbgemm_gpu/fbgemm_gpu/sparse_ops.py @@ -523,7 +523,7 @@ def batch_index_select_dim0_abstract( return inputs.new_empty([output_numel]) -@torch.library.impl_abstract("fbgemm::batch_index_select_dim0_tensor") +@impl_abstract("fbgemm::batch_index_select_dim0_tensor") def batch_index_select_dim0_tensor_abstract( inputs: torch.Tensor, indices: torch.Tensor, @@ -576,7 +576,7 @@ def batch_index_select_dim0_forward_cuda_impl_abstract( ] -@torch.library.impl_abstract("fbgemm::batch_index_select_dim0_tensor_forward_cuda_impl") +@impl_abstract("fbgemm::batch_index_select_dim0_tensor_forward_cuda_impl") def batch_index_select_dim0_tensor_forward_cuda_impl_abstract( inputs: torch.Tensor, indices: torch.Tensor, @@ -605,9 +605,7 @@ def batch_index_select_dim0_tensor_forward_cuda_impl_abstract( ] -@torch.library.impl_abstract( - "fbgemm::batch_index_select_dim0_tensor_backward_cuda_impl" -) +@impl_abstract("fbgemm::batch_index_select_dim0_tensor_backward_cuda_impl") def batch_index_select_dim0_tensor_backward_cuda_impl_abstract( grad_output: torch.Tensor, dev_weights: torch.Tensor, @@ -671,7 +669,7 @@ def keyed_jagged_index_select_dim1_abstract( return ret -@torch.library.impl_abstract("fbgemm::batch_index_select_dim0_backward_cuda_impl") +@impl_abstract("fbgemm::batch_index_select_dim0_backward_cuda_impl") def batch_index_select_dim0_backward_cuda_impl_abstract( grad_output: torch.Tensor, dev_weights: torch.Tensor,