forked from PaddlePaddle/Paddle
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathCMakeLists.txt
More file actions
36 lines (32 loc) · 1.29 KB
/
CMakeLists.txt
File metadata and controls
36 lines (32 loc) · 1.29 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
# DeepEP of 2025.05.19, commit: d5ca4495c0c068bc617102841b9322d378fac8ea
# Build the DeepEP CUDA kernel library `deepep_kernels`.
#
# WITH_NVSHMEM enabled : intranode, runtime, internode and low-latency kernels,
#                        compiled with relocatable device code and linked
#                        against nvshmem and cudadevrt.
# WITH_NVSHMEM disabled: only the intranode and runtime kernels, no extra deps.
if(WITH_NVSHMEM)
  # NOTE: this edits the directory-scoped CMAKE_CUDA_FLAGS, so it affects every
  # CUDA target defined from this point on in this directory.
  # -rdc=true enables relocatable device code; the ptxas options set the
  # register usage level and warn when a kernel uses local memory.
  set(CMAKE_CUDA_FLAGS
      "${CMAKE_CUDA_FLAGS} -rdc=true --ptxas-options=--register-usage-level=10,--warn-on-local-memory-usage"
  )
  # Drop every "-gencode arch=compute_XY,code=sm_XY" entry whose two-digit
  # numbers start with 0-8 (i.e. 00-89); entries outside that range are kept.
  # NOTE(review): presumably the NVSHMEM kernels only target sm_90 and newer -
  # confirm against the supported-architecture list.
  string(REGEX REPLACE "-gencode arch=compute_[0-8][0-9],code=sm_[0-8][0-9]" ""
                       CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS}")
  # Each kernel source is listed exactly once.
  set(DEEPEP_KERNEL_SRCS
      kernels/intranode.cu
      kernels/runtime.cu
      kernels/internode.cu
      kernels/internode_ll.cu
      kernels/internode_ll_two_stage.cu
      kernels/m2n_ll_two_stage.cu)
  cc_library(
    deepep_kernels
    SRCS ${DEEPEP_KERNEL_SRCS}
    DEPS nvshmem cudadevrt)
  # Compile the kernels as separable (relocatable) device code and perform the
  # device link step on this library itself.
  set_target_properties(
    deepep_kernels PROPERTIES CUDA_SEPARABLE_COMPILATION ON
                              CUDA_RESOLVE_DEVICE_SYMBOLS ON)
else()
  set(DEEPEP_KERNEL_SRCS kernels/intranode.cu kernels/runtime.cu)
  cc_library(deepep_kernels SRCS ${DEEPEP_KERNEL_SRCS})
endif()
# Host-side DeepEP library: the C++ entry point plus the event / stream
# helpers, linked against phi, common and the CUDA kernel library above.
cc_library(
  deep_ep
  SRCS deep_ep.cpp
       src/event_pool.cc
       src/event.cc
       src/CUDAStream.cc
  DEPS phi
       common
       deepep_kernels)
# Separable compilation is explicitly switched off for this target.
set_property(TARGET deep_ep PROPERTY CUDA_SEPARABLE_COMPILATION OFF)
# Silence member-initialisation-order and unused-variable warnings for the
# sources of this target only.
target_compile_options(
  deep_ep
  PRIVATE -Wno-reorder
          -Wno-unused-variable)