|
36 | 36 | ) |
37 | 37 |
|
38 | 38 | # CuTe-DSL kernels (conditionally exported) |
| 39 | +# Note: is_cute_dsl_available is used internally but not re-exported; |
| 40 | +# users should import from flashinfer.cute_dsl |
39 | 41 | from ..cute_dsl import is_cute_dsl_available |
40 | 42 |
|
41 | 43 | if is_cute_dsl_available(): |
42 | | - from .mxfp8_quantize_cute_dsl import ( |
43 | | - mxfp8_quantize_cute_dsl, |
44 | | - MXFP8QuantizeLinearKernel, |
45 | | - MXFP8QuantizeSwizzledKernel, |
46 | | - _get_compiled_kernel_linear, |
47 | | - _get_compiled_kernel_swizzled, |
48 | | - ) |
| 44 | + from .mxfp8_quantize_cute_dsl import mxfp8_quantize_cute_dsl |
49 | 45 |
|
50 | 46 | __all__ = [ |
51 | 47 | # Packbits |
|
69 | 65 | "shuffle_matrix_sf_a", |
70 | 66 | "scaled_fp4_grouped_quantize", |
71 | 67 | "get_fp4_quantization_module", |
72 | | - # CuTe-DSL availability check |
73 | | - "is_cute_dsl_available", |
74 | 68 | ] |
75 | 69 |
|
76 | 70 | if is_cute_dsl_available(): |
77 | 71 | __all__ += [ |
78 | 72 | "mxfp8_quantize_cute_dsl", |
79 | | - "MXFP8QuantizeLinearKernel", |
80 | | - "MXFP8QuantizeSwizzledKernel", |
81 | | - "_get_compiled_kernel_linear", |
82 | | - "_get_compiled_kernel_swizzled", |
83 | 73 | ] |
0 commit comments