4 changes: 2 additions & 2 deletions qa/L3_pytorch_FA_versions_test/test.sh
@@ -18,10 +18,10 @@ sm_arch=`python3 -c "import torch; sm = torch.cuda.get_device_capability(0); pri
 export FLASH_ATTN_CUDA_ARCHS=$sm_arch
 if [ $sm_arch -gt 90 ]
 then
-FA_versions=(2.8.1)
+FA_versions=(2.8.3)
 elif [ $sm_arch -eq 90 ]
 then
-FA_versions=(2.7.3 2.8.1 3.0.0b1)
+FA_versions=(2.7.3 2.8.3 3.0.0b1)

Collaborator: Do we need to modify this file, as it was for NV upstream QA?

Collaborator Author: We don't really need it, but it is part of the cherry-picked commit.

 fi

 for fa_version in "${FA_versions[@]}"
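The hunk header above truncates the sm_arch probe used by this QA script. A minimal Python sketch of what such a compute-capability check usually looks like follows; the exact print expression in test.sh is cut off in the diff, so the major*10 + minor encoding shown here (e.g. 90 for SM 9.0) is an assumption.

```python
# Hypothetical sketch of the sm_arch probe; the real one-liner in test.sh is
# truncated in the hunk header above, so the major*10 + minor encoding is an
# assumption (e.g. 90 for compute capability 9.0).
import torch

major, minor = torch.cuda.get_device_capability(0)  # requires a visible GPU
sm_arch = major * 10 + minor
print(sm_arch)
```

The script then branches on that number: -gt 90 pins only FA 2.8.3, while -eq 90 (Hopper) also tests 2.7.3 and 3.0.0b1.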
8 changes: 7 additions & 1 deletion tests/pytorch/attention/test_kv_cache.py
@@ -375,6 +375,12 @@ def get_tols(config, module, backend, dtype):
             torch.half: (5e-3, 5e-3),
             torch.bfloat16: (3.5e-2, 3.5e-2),
         }
+    # With FA on ROCm it may not fit default tolerance

Collaborator: Is this relaxation of tolerance due to upgrading to 2.8.3?

Collaborator Author: Yes. Even though I did see some numerical errors on the ROCm 7.2 image with FA 2.8.0 too, 2.8.3 showed a higher delta. It should be due to the new CK, I suppose; I didn't try the Triton backend.

+    if IS_HIP_EXTENSION and backend == "FlashAttention":
+        tols = {
+            torch.half: (5e-3, 5e-3),
+            torch.bfloat16: (4e-2, 4e-2),
+        }
     else:
         if backend == "UnfusedAttention":
             tols = {
@@ -389,7 +395,7 @@ def get_tols(config, module, backend, dtype):
     # With FA on ROCm it may not fit default tolerance
     if IS_HIP_EXTENSION and backend == "FlashAttention":
         tols = {
-            torch.half: (1e-2, 1e-2),
+            torch.half: (1.2e-2, 1.2e-2),
             torch.bfloat16: (1e-1, 1e-1),
         }
     if module == "DotProductAttention":
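For context on the tolerance thread above: get_tols returns per-dtype pairs that the test uses when comparing a backend's output against a reference. A minimal sketch of how such pairs are typically consumed follows; the (atol, rtol) ordering and the assert_close call are assumptions, since the consuming code is not part of this diff.

```python
# Hypothetical usage sketch for the dtype-dependent tolerances relaxed in this
# PR. The (atol, rtol) ordering is an assumption; the actual test may differ.
import torch

tols = {
    torch.half: (1.2e-2, 1.2e-2),
    torch.bfloat16: (1e-1, 1e-1),
}

def check(output: torch.Tensor, reference: torch.Tensor) -> None:
    atol, rtol = tols[output.dtype]
    torch.testing.assert_close(output, reference, atol=atol, rtol=rtol)
```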
@@ -1,5 +1,5 @@
 # This file was modified for portability to AMDGPU
-# Copyright (c) 2025, Advanced Micro Devices, Inc. All rights reserved.
+# Copyright (c) 2025-2026, Advanced Micro Devices, Inc. All rights reserved.
 # Copyright (c) 2022-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 #
 # See LICENSE for license information.
@@ -109,7 +109,7 @@ class FlashAttentionUtils:
     version = PkgVersion("0")
     version_required = PkgVersion("2.1.1")
     version_required_blackwell = PkgVersion("2.7.3")
-    max_version = PkgVersion("2.8.1")
+    max_version = PkgVersion("2.8.3")
     v2_plus = False
     v2_1_plus = False
     v2_3_plus = False
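The max_version bump above is what lets the PyTorch extension accept flash-attn 2.8.3 at import time. A rough sketch of how a PkgVersion-based gate like this typically works follows; it assumes PkgVersion is packaging.version.Version and that the installed distribution is named flash-attn, neither of which is shown in this diff.

```python
# Hypothetical sketch of a flash-attn version gate; assumes PkgVersion is
# packaging.version.Version and the distribution is named "flash-attn".
from importlib.metadata import PackageNotFoundError, version as installed_version
from packaging.version import Version as PkgVersion

version_required = PkgVersion("2.1.1")
max_version = PkgVersion("2.8.3")

def flash_attn_is_usable() -> bool:
    try:
        fa_version = PkgVersion(installed_version("flash-attn"))
    except PackageNotFoundError:
        return False
    return version_required <= fa_version <= max_version

print(flash_attn_is_usable())
```

With the cap at 2.8.3, this runtime check stays in sync with the 2.8.3 pin added to the QA matrix in test.sh above.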