Skip to content

Commit f9102aa

Browse files
authored
Merge branch 'main' into alechan/upgrade-xpk-v0.13.0
2 parents a63aa3f + 450fc8f commit f9102aa

File tree

1 file changed

+4
-2
lines changed

1 file changed

+4
-2
lines changed

.github/container/build-te.sh

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -126,8 +126,10 @@ print_var SRC_PATH_XLA
126126
echo "=================================================="
127127

128128
# Parse SM_LIST into the format accepted by TransformerEngine's build system
129-
# "1.2,3.4,5.6" -> "12-real;34-real;56", i.e. SASS plus PTX for the last one
130-
NVTE_CUDA_ARCHS="${SM_LIST//,/-real;}"
129+
# "1.2,3.4,5.6" -> "12;34;56". In principle we would like to compile SASS-only
130+
# plus PTX for the highest known architecture, but TransformerEngine's build
131+
# system does not currently handle that.
132+
NVTE_CUDA_ARCHS="${SM_LIST//,/;}"
131133
set -x
132134
export NVTE_CUDA_ARCHS="${NVTE_CUDA_ARCHS//./}"
133135
# Parallelism within nvcc invocations.

0 commit comments

Comments
 (0)