diff --git a/xformers/ops/fmha/dispatch.py b/xformers/ops/fmha/dispatch.py index 642f535c1c..8c0086e09d 100644 --- a/xformers/ops/fmha/dispatch.py +++ b/xformers/ops/fmha/dispatch.py @@ -16,7 +16,7 @@ T = TypeVar("T", Type[AttentionFwOpBase], Type[AttentionBwOpBase]) -_USE_FLASH_ATTENTION_3 = False +_USE_FLASH_ATTENTION_3 = True def _set_use_fa3(use_flash_attention3: bool) -> None: