Revert "test: skip cuda tests when sglang import fails"

gufengc · gufengc · commit 9e261235675d · 2026-05-30T00:10:43.000+08:00
This reverts commit c5bc7e3.
diff --git a/tests/test_model_cuda.py b/tests/test_model_cuda.py
@@ -16,16 +16,11 @@
 # Delay import of SGLExecutor to avoid import errors when sglang is not available
 # This allows test collection to succeed even if sglang is not installed
 SGLExecutor = None
-SGL_EXECUTOR_IMPORT_ERROR = None
 try:
     from parallax.server.executor.sglang_executor import SGLExecutor
-except ImportError as exc:
+except ImportError:
     # sglang not available, tests will be skipped
-    SGL_EXECUTOR_IMPORT_ERROR = exc
-except Exception as exc:
-    if is_cuda_available():
-        raise
-    SGL_EXECUTOR_IMPORT_ERROR = exc
+    pass
 
 CUDA_MODEL_REPO = "Qwen/Qwen3-0.6B"
 TOTAL_LAYERS = 28
@@ -69,10 +64,7 @@ def test_cuda_shard_prefill(layers_config: List[Tuple[int, int]], ref_model_and_
     but uses parallax's SGLExecutor instead of direct model loading.
     """
     if SGLExecutor is None:
-        pytest.skip(
-            "sglang not available or failed to import "
-            f"({type(SGL_EXECUTOR_IMPORT_ERROR).__name__}: {SGL_EXECUTOR_IMPORT_ERROR})"
-        )
+        pytest.skip("sglang not available (install with 'pip install -e .[gpu]')")
     if not is_cuda_available():
         pytest.skip("CUDA not available")
 
@@ -179,10 +171,7 @@ def test_cuda_executor_pipeline(ref_model_and_tokenizer):
     This test creates a 2-stage pipeline and verifies it can process requests.
     """
     if SGLExecutor is None:
-        pytest.skip(
-            "sglang not available or failed to import "
-            f"({type(SGL_EXECUTOR_IMPORT_ERROR).__name__}: {SGL_EXECUTOR_IMPORT_ERROR})"
-        )
+        pytest.skip("sglang not available (install with 'pip install -e .[gpu]')")
     if not is_cuda_available():
         pytest.skip("CUDA not available")