File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change 3030# tools/release_workspace.py.
3131SPDLOG_SUBMODULE_PATH = ROOT_DIR / "csrc" / "third_party" / "spdlog"
3232SPDLOG_HEADER_PATH = SPDLOG_SUBMODULE_PATH / "include" / "spdlog" / "spdlog.h"
33- # Blackwell sm100 is not has been fully tested, so we don't include it in the
34- # default target list.Users with sm100 devices can specify it explicitly with
35- # `CACHE_DIT_CUDA_ARCH_LIST=100` or `TORCH_CUDA_ARCH_LIST=100` when building
36- # the SVDQuant extension.
33+ # sm100 (Blackwell B100/B200, CC 10.0) is not included in the default
34+ # target list because the NVFP4 block-scaled MMA instruction used by the
35+ # SVDQuant FP4 kernel requires sm_120a or sm_121a (PTX ISA, warp-level mma
36+ # Target ISA Notes: ".kind::mxf4nvf4 and .kind::mxf4 are supported on
37+ # sm_120a and sm_121a"). INT4 kernels work correctly on sm100. Users who
38+ # only need INT4 kernels can build for sm100 explicitly via
39+ # CACHE_DIT_CUDA_ARCH_LIST=100 or TORCH_CUDA_ARCH_LIST=100.
3740CUDA_ARCH_ALIASES = {
3841 "maxwell" : "50" ,
3942 "pascal" : "60" ,
4245 "ampere" : "80" ,
4346 "ada" : "89" ,
4447 "hopper" : "90" ,
48+ "blackwell" : "100" ,
4549}
4650
4751
You can’t perform that action at this time.
0 commit comments