We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 6d9ed8a commit f3dae20 Copy full SHA for f3dae20
1 file changed
flashinfer/fused_moe/__init__.py
@@ -15,10 +15,6 @@
15
"""
16
17
from .core import (
18
- ActivationType,
19
- Fp8QuantizationType,
20
- RoutingMethodType,
21
- WeightLayout,
22
convert_to_block_layout,
23
cutlass_fused_moe,
24
gen_cutlass_fused_moe_sm120_module,
@@ -37,6 +33,13 @@
37
33
trtllm_mxint4_block_scale_moe,
38
34
)
39
35
36
+from ..tllm_enums import (
+ ActivationType,
+ Fp8QuantizationType,
+ WeightLayout,
40
+ RoutingMethodType,
41
+)
42
+
43
from .fused_routing_dsv3 import ( # noqa: F401
44
fused_topk_deepseek as fused_topk_deepseek,
45
0 commit comments