.. currentmodule:: flashinfer.gemm

This module provides a set of GEMM operations.


.. autosummary::
   :toctree: ../generated

   mm_bf16
   bmm_bf16


.. autosummary::
   :toctree: ../generated

   mm_fp4


.. autosummary::
   :toctree: ../generated

   bmm_fp8
   gemm_fp8_nt_groupwise
   group_gemm_fp8_nt_groupwise
   group_deepgemm_fp8_nt_groupwise
   batch_deepgemm_fp8_nt_groupwise


.. autosummary::
   :toctree: ../generated

   group_gemm_mxfp4_nt_groupwise


.. autoclass:: SegmentGEMMWrapper
   :members:
   :exclude-members: forward

   .. automethod:: __init__
