[Fix] Refine Checks for SDPA Availability (#4820)

Bobholamovic · Bobholamovic · commit 3fe80ebeca29 · 2025-12-11T03:46:03.000Z
* Do not use SDPA for SM120 GPUs

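* Fix: enable SDPA only when compute capability >= 8.0, Paddle CUDA version >= 11.4, and the OS is Linux; always enable it on iluvatar_gpu devices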
diff --git a/paddlex/inference/models/doc_vlm/modeling/paddleocr_vl/_siglip.py b/paddlex/inference/models/doc_vlm/modeling/paddleocr_vl/_siglip.py
@@ -35,14 +35,19 @@
 
 # TODO: Weight initialization
 
+import platform
 from typing import List, Optional, Tuple, Union
 
 import numpy as np
 import paddle
 import paddle.nn as nn
 import paddle.nn.functional as F
 
-from ......utils.env import get_gpu_compute_capability
+from ......utils.env import (
+    get_device_type,
+    get_gpu_compute_capability,
+    get_paddle_cuda_version,
+)
 from ....common.vlm.activations import ACT2FN
 from ....common.vlm.transformers import PretrainedModel
 from ....common.vlm.transformers.model_outputs import (
@@ -139,7 +144,18 @@ def __init__(self, config):
         self.out_proj = nn.Linear(self.embed_dim, self.embed_dim)
 
         cap = get_gpu_compute_capability()
-        self._supports_sdpa = cap >= (8, 0) if cap is not None else False
+        cuda_ver = get_paddle_cuda_version()
+        self._supports_sdpa = False
+        if (
+            cap is not None
+            and cap >= (8, 0)
+            and cuda_ver is not None
+            and cuda_ver >= (11, 4)
+            and platform.system() == "Linux"
+        ):
+            self._supports_sdpa = True
+        if get_device_type() == "iluvatar_gpu":
+            self._supports_sdpa = True
 
     def forward(
         self,