Skip to content

Commit 46651af

Browse files
authored
Merge branch 'develop' into mv_xx_axis_op
2 parents c4d57f3 + 71cb016 commit 46651af

File tree

1,029 files changed

+43565
-22297
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

1,029 files changed

+43565
-22297
lines changed

.gitignore

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -7,9 +7,11 @@ paddle/fluid/op_use_default_grad_maker_DEV.spec
77
paddle/fluid/op_use_default_grad_maker_PR.spec
88
paddle/phi/api/backward/backward_api.h
99
paddle/phi/api/include/api.h
10+
paddle/phi/api/include/sparse_api.h
1011
paddle/phi/api/lib/api.cc
1112
paddle/phi/api/lib/dygraph_api.*
1213
paddle/phi/api/lib/backward_api.cc
14+
paddle/phi/api/lib/sparse_api.cc
1315
paddle/phi/extension.h
1416
paddle/phi/include/*
1517
paddle/phi/infermeta/generated.*
@@ -49,6 +51,9 @@ tools/__pycache__
4951
# This file is automatically generated.
5052
# TODO(zhiqiang) Move this file to build directory.
5153
paddle/infrt/dialect/pd_ops.td
54+
paddle/infrt/dialect/phi/ir/phi_cpu_kernels.td
55+
paddle/infrt/dialect/phi/ir/phi_gpu_kernels.td
56+
tools/infrt/kernels.json
5257
paddle/infrt/dialect/pd_ops_info.h
5358
.lit_test_times.txt
5459
paddle/infrt/tests/dialect/Output

CMakeLists.txt

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -238,7 +238,8 @@ option(WITH_MIPS "Compile PaddlePaddle with mips support" OFF)
238238
option(WITH_MUSL "Compile with musl libc instead of gblic" OFF)
239239
option(WITH_UNITY_BUILD "Compile with UnityBuild mode" OFF)
240240
option(WITH_STRIP "Strip so files of Whl packages" OFF)
241-
option(NEW_RELEASE_CUBIN "PaddlePaddle next-level release strategy for pypi cubin package" OFF)
241+
option(NEW_RELEASE_PYPI "PaddlePaddle next-level release strategy for pypi cubin package" OFF)
242+
option(NEW_RELEASE_ALL "PaddlePaddle next-level release strategy for all arches cubin package" OFF)
242243
option(NEW_RELEASE_JIT "PaddlePaddle next-level release strategy for backup jit package" OFF)
243244
option(WITH_ASCEND_INT64 "Compile with int64 kernel for ascend NPU" OFF)
244245
option(WITH_POCKETFFT "Compile with pocketfft support" ON)

README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ English | [简体中文](./README_cn.md)
1515
Welcome to the PaddlePaddle GitHub.
1616

1717
PaddlePaddle, as the only independent R&D deep learning platform in China, has been officially open-sourced to professional communities since 2016. It is an industrial platform with advanced technologies and rich features that cover core deep learning frameworks, basic model libraries, end-to-end development kits, tools & components as well as service platforms.
18-
PaddlePaddle originated from industrial practices with dedication and commitments to industrialization. It has been widely adopted by a wide range of sectors including manufacturing, agriculture, enterprise service, and so on while serving more than 2.3 million developers. With such advantages, PaddlePaddle has helped an increasing number of partners commercialize AI.
18+
PaddlePaddle originated from industrial practices with dedication and commitments to industrialization. It has been widely adopted by a wide range of sectors including manufacturing, agriculture, enterprise service, and so on while serving more than 4 million developers. With such advantages, PaddlePaddle has helped an increasing number of partners commercialize AI.
1919

2020

2121

README_cn.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@
1515

1616
欢迎来到 PaddlePaddle GitHub
1717

18-
飞桨(PaddlePaddle)以百度多年的深度学习技术研究和业务应用为基础,是中国首个自主研发、功能完备、 开源开放的产业级深度学习平台,集深度学习核心训练和推理框架、基础模型库、端到端开发套件和丰富的工具组件于一体。目前,飞桨累计开发者265万,服务企业10万家,基于飞桨开源深度学习平台产生了34万个模型。飞桨助力开发者快速实现AI想法,快速上线AI业务。帮助越来越多的行业完成AI赋能,实现产业智能化升级。
18+
飞桨(PaddlePaddle)以百度多年的深度学习技术研究和业务应用为基础,是中国首个自主研发、功能完备、 开源开放的产业级深度学习平台,集深度学习核心训练和推理框架、基础模型库、端到端开发套件和丰富的工具组件于一体。目前,飞桨累计开发者406万,服务企业15.7万家,基于飞桨开源深度学习平台产生了47.6万个模型。飞桨助力开发者快速实现AI想法,快速上线AI业务。帮助越来越多的行业完成AI赋能,实现产业智能化升级。
1919

2020
## 安装
2121

cmake/cuda.cmake

Lines changed: 13 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -6,16 +6,22 @@ if(WITH_NV_JETSON)
66
add_definitions(-DWITH_NV_JETSON)
77
set(paddle_known_gpu_archs "53 62 72")
88
set(paddle_known_gpu_archs10 "53 62 72")
9-
elseif(NEW_RELEASE_CUBIN)
9+
elseif(NEW_RELEASE_ALL)
10+
message("Using New Release Strategy - All Arches Packge")
11+
add_definitions(-DNEW_RELEASE_ALL)
12+
set(paddle_known_gpu_archs "35 50 52 60 61 70 75 80 86")
13+
set(paddle_known_gpu_archs10 "35 50 52 60 61 70 75")
14+
set(paddle_known_gpu_archs11 "35 50 52 60 61 70 75 80")
15+
elseif(NEW_RELEASE_PYPI)
1016
message("Using New Release Strategy - Cubin Packge")
11-
add_definitions(-DNEW_RELEASE_CUBIN)
12-
set(paddle_known_gpu_archs "35 37 50 52 60 61 70 75 80 86")
13-
set(paddle_known_gpu_archs10 "50 60 70 75")
14-
set(paddle_known_gpu_archs11 "60 70 75 80")
17+
add_definitions(-DNEW_RELEASE_PYPI)
18+
set(paddle_known_gpu_archs "35 50 52 60 61 70 75 80 86")
19+
set(paddle_known_gpu_archs10 "")
20+
set(paddle_known_gpu_archs11 "60 61 70 75 80")
1521
elseif(NEW_RELEASE_JIT)
1622
message("Using New Release Strategy - JIT Packge")
1723
add_definitions(-DNEW_RELEASE_JIT)
18-
set(paddle_known_gpu_archs "35 37 50 52 60 61 70 75 80 86")
24+
set(paddle_known_gpu_archs "35 50 52 60 61 70 75 80 86")
1925
set(paddle_known_gpu_archs10 "35 50 60 70 75")
2026
set(paddle_known_gpu_archs11 "35 50 60 70 75 80")
2127
else()
@@ -148,7 +154,7 @@ function(select_nvcc_arch_flags out_variable)
148154

149155
# remove dots and convert to lists
150156
string(REGEX REPLACE "\\." "" cuda_arch_bin "${cuda_arch_bin}")
151-
string(REGEX REPLACE "\\." "" cuda_arch_ptx "${CUDA_ARCH_PTX}")
157+
string(REGEX REPLACE "\\." "" cuda_arch_ptx "${cuda_arch_ptx}")
152158
string(REGEX MATCHALL "[0-9()]+" cuda_arch_bin "${cuda_arch_bin}")
153159
string(REGEX MATCHALL "[0-9]+" cuda_arch_ptx "${cuda_arch_ptx}")
154160

cmake/external/xpu.cmake

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -36,7 +36,7 @@ ENDIF()
3636

3737
if(NOT DEFINED XPU_BASE_URL)
3838
SET(XPU_BASE_URL_WITHOUT_DATE "https://baidu-kunlun-product.cdn.bcebos.com/KL-SDK/klsdk-dev")
39-
SET(XPU_BASE_URL "${XPU_BASE_URL_WITHOUT_DATE}/20220219")
39+
SET(XPU_BASE_URL "${XPU_BASE_URL_WITHOUT_DATE}/20220228")
4040
else()
4141
SET(XPU_BASE_URL "${XPU_BASE_URL}")
4242
endif()

cmake/generic.cmake

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -580,8 +580,8 @@ function(hip_library TARGET_NAME)
580580
cmake_parse_arguments(hip_library "${options}" "${oneValueArgs}" "${multiValueArgs}" ${ARGN})
581581
if(hip_library_SRCS)
582582
# FindHIP.cmake defines hip_add_library; HIP_SOURCE_PROPERTY_FORMAT is required if no .cu files are found
583-
if(NOT ${CMAKE_CURRENT_SOURCE_DIR} MATCHES ".*/operators")
584-
set_source_files_properties(${hip_library_SRCS} PROPERTIES HIP_SOURCE_PROPERTY_FORMAT 1)
583+
if(NOT (${CMAKE_CURRENT_SOURCE_DIR} MATCHES ".*/operators" OR ${CMAKE_CURRENT_SOURCE_DIR} MATCHES ".*/phi/kernels"))
584+
set_source_files_properties(${hip_library_SRCS} PROPERTIES HIP_SOURCE_PROPERTY_FORMAT 1)
585585
endif()
586586
if (hip_library_SHARED OR hip_library_shared) # build *.so
587587
hip_add_library(${TARGET_NAME} SHARED ${hip_library_SRCS})
@@ -651,6 +651,7 @@ function(hip_test TARGET_NAME)
651651
set_property(TEST ${TARGET_NAME} PROPERTY ENVIRONMENT FLAGS_cpu_deterministic=true)
652652
set_property(TEST ${TARGET_NAME} PROPERTY ENVIRONMENT FLAGS_init_allocated_mem=true)
653653
set_property(TEST ${TARGET_NAME} PROPERTY ENVIRONMENT FLAGS_cudnn_deterministic=true)
654+
set_property(TEST ${TARGET_NAME} PROPERTY ENVIRONMENT "LD_LIBRARY_PATH=${CMAKE_BINARY_DIR}/python/paddle/libs:$LD_LIBRARY_PATH")
654655
endif()
655656
endfunction(hip_test)
656657

@@ -667,6 +668,7 @@ function(xpu_library TARGET_NAME)
667668
else()
668669
xpu_add_library(${TARGET_NAME} STATIC ${xpu_library_SRCS} DEPENDS ${xpu_library_DEPS})
669670
find_fluid_modules(${TARGET_NAME})
671+
find_phi_modules(${TARGET_NAME})
670672
endif()
671673
if (xpu_library_DEPS)
672674
add_dependencies(${TARGET_NAME} ${xpu_library_DEPS})

cmake/phi.cmake

Lines changed: 52 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -83,6 +83,8 @@ function(kernel_declare TARGET_LIST)
8383
file(APPEND ${kernel_declare_file} "PD_DECLARE_KERNEL(${kernel_name}, XPU, ALL_LAYOUT);\n")
8484
elseif (${kernel_path} MATCHES "./gpudnn\/")
8585
file(APPEND ${kernel_declare_file} "PD_DECLARE_KERNEL(${kernel_name}, GPUDNN, ALL_LAYOUT);\n")
86+
elseif (${kernel_path} MATCHES "./kps\/")
87+
file(APPEND ${kernel_declare_file} "PD_DECLARE_KERNEL(${kernel_name}, KPS, ALL_LAYOUT);\n")
8688
else ()
8789
# deal with device-independent kernels; for now we use CPU temporarily
8890
file(APPEND ${kernel_declare_file} "PD_DECLARE_KERNEL(${kernel_name}, CPU, ALL_LAYOUT);\n")
@@ -97,6 +99,7 @@ function(kernel_library TARGET)
9799
set(gpu_srcs)
98100
set(xpu_srcs)
99101
set(gpudnn_srcs)
102+
set(kps_srcs)
100103
set(selected_rows_srcs)
101104
# parse and save the deps kernel targets
102105
set(all_srcs)
@@ -128,6 +131,9 @@ function(kernel_library TARGET)
128131
if (EXISTS ${CMAKE_CURRENT_SOURCE_DIR}/gpu/${TARGET}.cu.cc)
129132
list(APPEND gpu_srcs ${CMAKE_CURRENT_SOURCE_DIR}/gpu/${TARGET}.cu.cc)
130133
endif()
134+
if (EXISTS ${CMAKE_CURRENT_SOURCE_DIR}/kps/${TARGET}.cu)
135+
list(APPEND gpu_srcs ${CMAKE_CURRENT_SOURCE_DIR}/kps/${TARGET}.cu)
136+
endif()
131137
if (EXISTS ${CMAKE_CURRENT_SOURCE_DIR}/gpudnn/${TARGET}_gpudnn.cu)
132138
list(APPEND gpudnn_srcs ${CMAKE_CURRENT_SOURCE_DIR}/gpudnn/${TARGET}_gpudnn.cu)
133139
endif()
@@ -137,6 +143,15 @@ function(kernel_library TARGET)
137143
list(APPEND xpu_srcs ${CMAKE_CURRENT_SOURCE_DIR}/xpu/${TARGET}.cc)
138144
endif()
139145
endif()
146+
if (WITH_XPU_KP)
147+
if (EXISTS ${CMAKE_CURRENT_SOURCE_DIR}/kps/${TARGET}.cu)
148+
# Change XPU2 file suffix
149+
# NOTE(chenweihang): If we can be sure that the *.kps suffix is no longer used, it can be copied directly to *.xpu
150+
file(COPY ${CMAKE_CURRENT_SOURCE_DIR}/kps/${TARGET}.cu DESTINATION ${CMAKE_CURRENT_BINARY_DIR}/kps)
151+
file(RENAME ${CMAKE_CURRENT_BINARY_DIR}/kps/${TARGET}.cu ${CMAKE_CURRENT_BINARY_DIR}/kps/${TARGET}.kps)
152+
list(APPEND kps_srcs ${CMAKE_CURRENT_BINARY_DIR}/kps/${TARGET}.kps)
153+
endif()
154+
endif()
140155
else()
141156
# TODO(chenweihang): impl compile by source later
142157
endif()
@@ -150,6 +165,7 @@ function(kernel_library TARGET)
150165
list(APPEND all_srcs ${gpu_srcs})
151166
list(APPEND all_srcs ${xpu_srcs})
152167
list(APPEND all_srcs ${gpudnn_srcs})
168+
list(APPEND all_srcs ${kps_srcs})
153169
foreach(src ${all_srcs})
154170
file(READ ${src} target_content)
155171
string(REGEX MATCHALL "#include \"paddle\/phi\/kernels\/[a-z0-9_]+_kernel.h\"" include_kernels ${target_content})
@@ -159,11 +175,11 @@ function(kernel_library TARGET)
159175
string(REGEX MATCHALL "#include \"paddle\/phi\/kernels\/${kernel_library_SUB_DIR}\/[a-z0-9_]+_kernel.h\"" include_kernels ${target_content})
160176
endif()
161177
foreach(include_kernel ${include_kernels})
162-
if ("${kernel_library_SUB_DIR}" STREQUAL "")
163-
string(REGEX REPLACE "#include \"paddle\/phi\/kernels\/" "" kernel_name ${include_kernel})
164-
else()
165-
string(REGEX REPLACE "#include \"paddle\/phi\/kernels\/${kernel_library_SUB_DIR}\/" "" kernel_name ${include_kernel})
166-
endif()
178+
if ("${kernel_library_SUB_DIR}" STREQUAL "")
179+
string(REGEX REPLACE "#include \"paddle\/phi\/kernels\/" "" kernel_name ${include_kernel})
180+
else()
181+
string(REGEX REPLACE "#include \"paddle\/phi\/kernels\/${kernel_library_SUB_DIR}\/" "" kernel_name ${include_kernel})
182+
endif()
167183
string(REGEX REPLACE ".h\"" "" kernel_name ${kernel_name})
168184
list(APPEND kernel_deps ${kernel_name})
169185
endforeach()
@@ -176,11 +192,20 @@ function(kernel_library TARGET)
176192
list(LENGTH gpu_srcs gpu_srcs_len)
177193
list(LENGTH xpu_srcs xpu_srcs_len)
178194
list(LENGTH gpudnn_srcs gpudnn_srcs_len)
195+
list(LENGTH kps_srcs kps_srcs_len)
179196
list(LENGTH selected_rows_srcs selected_rows_srcs_len)
180197

198+
# kernel source file level
199+
# level 1: base device kernel
200+
# - cpu_srcs / gpu_srcs / xpu_srcs / kps_srcs
201+
# level 2: device-independent kernel
202+
# - common_srcs
203+
# level 3: Kernel implemented by reusing device-independent kernel
204+
# - selected_rows_srcs
205+
181206
# Build Target according to different src organization
182207
if((${cpu_srcs_len} GREATER 0 OR ${gpu_srcs_len} GREATER 0 OR
183-
${xpu_srcs_len} GREATER 0 OR ${gpudnn_srcs_len} GREATER 0) AND
208+
${xpu_srcs_len} GREATER 0 OR ${gpudnn_srcs_len} GREATER 0 OR ${kps_srcs_len} GREATER 0) AND
184209
(${common_srcs_len} GREATER 0 OR ${selected_rows_srcs_len} GREATER 0))
185210
# If the common_srcs/selected_rows_srcs depends on specific device srcs, build target using this rule.
186211
if (WITH_GPU)
@@ -193,14 +218,19 @@ function(kernel_library TARGET)
193218
hip_library(${TARGET}_part SRCS ${cpu_srcs} ${gpu_srcs} ${gpudnn_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
194219
hip_library(${TARGET} SRCS ${common_srcs} ${selected_rows_srcs} DEPS ${TARGET}_part)
195220
endif()
221+
elseif (WITH_XPU_KP)
222+
if (${cpu_srcs_len} GREATER 0 OR ${xpu_srcs_len} GREATER 0 OR ${kps_srcs_len} GREATER 0)
223+
xpu_library(${TARGET}_part SRCS ${cpu_srcs} ${xpu_srcs} ${kps_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
224+
xpu_library(${TARGET} SRCS ${common_srcs} ${selected_rows_srcs} DEPS ${TARGET}_part)
225+
endif()
196226
else()
197227
if (${cpu_srcs_len} GREATER 0 OR ${xpu_srcs_len} GREATER 0)
198228
cc_library(${TARGET}_part SRCS ${cpu_srcs} ${xpu_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
199229
cc_library(${TARGET} SRCS ${common_srcs} ${selected_rows_srcs} DEPS ${TARGET}_part)
200230
endif()
201231
endif()
202232
# If there are only specific device srcs, build target using this rule.
203-
elseif (${cpu_srcs_len} GREATER 0 OR ${gpu_srcs_len} GREATER 0 OR ${xpu_srcs_len} GREATER 0 OR ${gpudnn_srcs_len} GREATER 0)
233+
elseif (${cpu_srcs_len} GREATER 0 OR ${gpu_srcs_len} GREATER 0 OR ${xpu_srcs_len} GREATER 0 OR ${gpudnn_srcs_len} GREATER 0 OR ${kps_srcs_len} GREATER 0)
204234
if (WITH_GPU)
205235
if (${cpu_srcs_len} GREATER 0 OR ${gpu_srcs_len} GREATER 0 OR ${gpudnn_srcs_len} GREATER 0)
206236
nv_library(${TARGET} SRCS ${cpu_srcs} ${gpu_srcs} ${gpudnn_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
@@ -209,6 +239,10 @@ function(kernel_library TARGET)
209239
if (${cpu_srcs_len} GREATER 0 OR ${gpu_srcs_len} GREATER 0 OR ${gpudnn_srcs_len} GREATER 0)
210240
hip_library(${TARGET} SRCS ${cpu_srcs} ${gpu_srcs} ${gpudnn_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
211241
endif()
242+
elseif (WITH_XPU_KP)
243+
if (${cpu_srcs_len} GREATER 0 OR ${xpu_srcs_len} GREATER 0 OR ${kps_srcs_len} GREATER 0)
244+
xpu_library(${TARGET} SRCS ${cpu_srcs} ${xpu_srcs} ${kps_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
245+
endif()
212246
else()
213247
if (${cpu_srcs_len} GREATER 0 OR ${xpu_srcs_len} GREATER 0)
214248
cc_library(${TARGET} SRCS ${cpu_srcs} ${xpu_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
@@ -222,6 +256,9 @@ function(kernel_library TARGET)
222256
elseif (WITH_ROCM)
223257
hip_library(${TARGET}_part SRCS ${common_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
224258
hip_library(${TARGET} SRCS ${selected_rows_srcs} DEPS ${TARGET}_part)
259+
elseif (WITH_XPU_KP)
260+
xpu_library(${TARGET}_part SRCS ${common_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
261+
xpu_library(${TARGET} SRCS ${selected_rows_srcs} DEPS ${TARGET}_part)
225262
else()
226263
cc_library(${TARGET}_part SRCS ${common_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
227264
cc_library(${TARGET} SRCS ${selected_rows_srcs} DEPS ${TARGET}_part)
@@ -232,6 +269,8 @@ function(kernel_library TARGET)
232269
nv_library(${TARGET} SRCS ${common_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
233270
elseif (WITH_ROCM)
234271
hip_library(${TARGET} SRCS ${common_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
272+
elseif (WITH_XPU_KP)
273+
xpu_library(${TARGET} SRCS ${common_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
235274
else()
236275
cc_library(${TARGET} SRCS ${common_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
237276
endif()
@@ -240,6 +279,8 @@ function(kernel_library TARGET)
240279
nv_library(${TARGET} SRCS ${selected_rows_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
241280
elseif (WITH_ROCM)
242281
hip_library(${TARGET} SRCS ${selected_rows_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
282+
elseif (WITH_XPU_KP)
283+
xpu_library(${TARGET} SRCS ${selected_rows_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
243284
else()
244285
cc_library(${TARGET} SRCS ${selected_rows_srcs} DEPS ${kernel_library_DEPS} ${kernel_deps})
245286
endif()
@@ -249,7 +290,7 @@ function(kernel_library TARGET)
249290

250291
if (${target_build_flag} EQUAL 1)
251292
if (${common_srcs_len} GREATER 0 OR ${cpu_srcs_len} GREATER 0 OR
252-
${gpu_srcs_len} GREATER 0 OR ${xpu_srcs_len} GREATER 0 OR
293+
${gpu_srcs_len} GREATER 0 OR ${xpu_srcs_len} GREATER 0 OR ${kps_srcs_len} GREATER 0 OR
253294
${gpudnn_srcs_len} GREATER 0 OR ${selected_rows_srcs_len} GREATER 0)
254295
# append target into PHI_KERNELS property
255296
get_property(phi_kernels GLOBAL PROPERTY PHI_KERNELS)
@@ -275,6 +316,9 @@ function(kernel_library TARGET)
275316
if (${gpudnn_srcs_len} GREATER 0)
276317
kernel_declare(${gpudnn_srcs})
277318
endif()
319+
if (${kps_srcs_len} GREATER 0)
320+
kernel_declare(${kps_srcs})
321+
endif()
278322
if (${selected_rows_srcs_len} GREATER 0)
279323
kernel_declare(${selected_rows_srcs})
280324
endif()

paddle/fluid/distributed/collective/CMakeLists.txt

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,8 @@
11
cc_library(processgroup SRCS ProcessGroup.cc DEPS phi phi_api eager_api)
2+
if (WITH_DISTRIBUTE)
3+
cc_library(processgroup_gloo SRCS ProcessGroupGloo.cc DEPS phi phi_api eager_api gloo_wrapper)
4+
endif()
5+
cc_library(eager_reducer SRCS reducer.cc DEPS eager_api processgroup)
26

37
if(WITH_NCCL)
48
cc_library(processgroup_nccl SRCS ProcessGroupNCCL.cc DEPS place cuda_stream enforce collective_helper device_context phi phi_api eager_api)

0 commit comments

Comments
 (0)