We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent f4f8a1b commit ebda73d (Copy full SHA for ebda73d)
1 file changed
python/sglang/srt/layers/quantization/modelopt_quant.py
@@ -79,7 +79,7 @@
79
"SGLANG_CUTEDSL_MOE_SCALAR_INPUT_SCALE", "true"
80
)
81
USE_CUTLASS_BACKEND_FOR_FP4_GEMM = get_bool_env_var(
82
- "SGLANG_USE_CUTLASS_BACKEND_FOR_FP4_GEMM"
+ "SGLANG_USE_CUTLASS_BACKEND_FOR_FP4_GEMM", "true"
83
84
# TODO make it true by default when the DeepEP PR is merged
85
CUTEDSL_MOE_NVFP4_DISPATCH = get_bool_env_var(
0 commit comments