Skip to content

Commit ebda73d

Browse files
authored
Use cutlass fp4 gemm by default (sgl-project#11813)
1 parent f4f8a1b commit ebda73d

1 file changed

Lines changed: 1 addition & 1 deletion

File tree

python/sglang/srt/layers/quantization/modelopt_quant.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -79,7 +79,7 @@
7979
"SGLANG_CUTEDSL_MOE_SCALAR_INPUT_SCALE", "true"
8080
)
8181
USE_CUTLASS_BACKEND_FOR_FP4_GEMM = get_bool_env_var(
82-
"SGLANG_USE_CUTLASS_BACKEND_FOR_FP4_GEMM"
82+
"SGLANG_USE_CUTLASS_BACKEND_FOR_FP4_GEMM", "true"
8383
)
8484
# TODO make it true by default when the DeepEP PR is merged
8585
CUTEDSL_MOE_NVFP4_DISPATCH = get_bool_env_var(

0 commit comments

Comments
 (0)