Skip to content

Commit 769c525

Browse files
committed
Merge branch 'develop' of https://github.com/PaddlePaddle/Paddle into add_leaky_relu_op_npu
2 parents d315202 + 8009257 commit 769c525

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

54 files changed

+2609
-446
lines changed

CMakeLists.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -130,7 +130,7 @@ if(WIN32)
130130
# NOTE(zhouwei25): GPU compilation has too high memory utilization when compiling in parallel.
131131
# For Visual Studio generators, /MP should be added.
132132
# For other generators like Ninja, there is no need to add /MP.
133-
if("${CMAKE_GENERATOR}" STREQUAL "Visual Studio" AND NOT WITH_GPU)
133+
if(CMAKE_GENERATOR MATCHES "Visual Studio" AND NOT WITH_GPU)
134134
math(EXPR PROCESS_MAX "${CPU_CORES} * 2 / 3")
135135
set(${flag_var} "${${flag_var}} /MP${PROCESS_MAX}")
136136
endif()

cmake/external/gflags.cmake

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -41,6 +41,7 @@ ExternalProject_Add(
4141
${SHALLOW_CLONE}
4242
"${GFLAGS_DOWNLOAD_CMD}"
4343
PREFIX ${GFLAGS_PREFIX_DIR}
44+
UPDATE_COMMAND ""
4445
SOURCE_DIR ${GFLAGS_SOURCE_DIR}
4546
BUILD_COMMAND ${BUILD_COMMAND}
4647
INSTALL_COMMAND ${INSTALL_COMMAND}

cmake/external/glog.cmake

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -45,6 +45,7 @@ ExternalProject_Add(
4545
DEPENDS gflags
4646
PREFIX ${GLOG_PREFIX_DIR}
4747
SOURCE_DIR ${GLOG_SOURCE_DIR}
48+
UPDATE_COMMAND ""
4849
CMAKE_ARGS -DCMAKE_CXX_COMPILER=${CMAKE_CXX_COMPILER}
4950
-DCMAKE_C_COMPILER=${CMAKE_C_COMPILER}
5051
-DCMAKE_CXX_FLAGS=${GLOG_CMAKE_CXX_FLAGS}

cmake/external/mkldnn.cmake

Lines changed: 25 additions & 30 deletions
Original file line numberDiff line numberDiff line change
@@ -79,49 +79,44 @@ ExternalProject_Add(
7979
-DCMAKE_CXX_FLAGS=${MKLDNN_CXXFLAG}
8080
-DDNNL_BUILD_TESTS=OFF -DDNNL_BUILD_EXAMPLES=OFF
8181
CMAKE_CACHE_ARGS -DCMAKE_INSTALL_PREFIX:PATH=${MKLDNN_INSTALL_DIR}
82-
BUILD_BYPRODUCTS ${MKLDNN_LIB}
8382
)
8483

85-
ADD_LIBRARY(shared_mkldnn SHARED IMPORTED GLOBAL)
86-
SET_PROPERTY(TARGET shared_mkldnn PROPERTY IMPORTED_LOCATION ${MKLDNN_LIB})
87-
ADD_DEPENDENCIES(shared_mkldnn ${MKLDNN_PROJECT})
8884
MESSAGE(STATUS "MKLDNN library: ${MKLDNN_LIB}")
8985
add_definitions(-DPADDLE_WITH_MKLDNN)
90-
91-
# generate a static dummy target to track mkldnn dependencies
92-
# for cc_library(xxx SRCS xxx.c DEPS mkldnn)
93-
generate_dummy_static_lib(LIB_NAME "mkldnn" GENERATOR "mkldnn.cmake")
94-
95-
TARGET_LINK_LIBRARIES(mkldnn ${MKLDNN_LIB} ${MKLML_IOMP_LIB})
96-
ADD_DEPENDENCIES(mkldnn ${MKLDNN_PROJECT})
97-
9886
# copy the real so.0 lib to install dir
9987
# it can be directly contained in wheel or capi
10088
if(WIN32)
10189
SET(MKLDNN_SHARED_LIB ${MKLDNN_INSTALL_DIR}/bin/mkldnn.dll)
10290

10391
file(TO_NATIVE_PATH ${MKLDNN_INSTALL_DIR} NATIVE_MKLDNN_INSTALL_DIR)
10492
file(TO_NATIVE_PATH ${MKLDNN_SHARED_LIB} NATIVE_MKLDNN_SHARED_LIB)
105-
ADD_CUSTOM_COMMAND(TARGET ${MKLDNN_PROJECT} POST_BUILD
106-
COMMAND (copy ${NATIVE_MKLDNN_INSTALL_DIR}\\bin\\dnnl.dll ${NATIVE_MKLDNN_SHARED_LIB} /Y))
107-
add_custom_command(TARGET ${MKLDNN_PROJECT} POST_BUILD VERBATIM
108-
COMMAND dumpbin /exports ${MKLDNN_INSTALL_DIR}/bin/mkldnn.dll > ${MKLDNN_INSTALL_DIR}/bin/exports.txt)
109-
add_custom_command(TARGET ${MKLDNN_PROJECT} POST_BUILD VERBATIM
110-
COMMAND echo LIBRARY mkldnn > ${MKLDNN_INSTALL_DIR}/bin/mkldnn.def)
111-
add_custom_command(TARGET ${MKLDNN_PROJECT} POST_BUILD VERBATIM
112-
COMMAND echo EXPORTS >> ${MKLDNN_INSTALL_DIR}/bin/mkldnn.def)
113-
add_custom_command(TARGET ${MKLDNN_PROJECT} POST_BUILD VERBATIM
114-
COMMAND echo off && (for /f "skip=19 tokens=4" %A in (${MKLDNN_INSTALL_DIR}/bin/exports.txt) do echo %A >> ${MKLDNN_INSTALL_DIR}/bin/mkldnn.def) && echo on)
115-
add_custom_command(TARGET ${MKLDNN_PROJECT} POST_BUILD VERBATIM
116-
COMMAND lib /def:${MKLDNN_INSTALL_DIR}/bin/mkldnn.def /out:${MKLDNN_INSTALL_DIR}/bin/mkldnn.lib /machine:x64)
93+
94+
ADD_CUSTOM_COMMAND(OUTPUT ${MKLDNN_LIB}
95+
COMMAND (copy ${NATIVE_MKLDNN_INSTALL_DIR}\\bin\\dnnl.dll ${NATIVE_MKLDNN_SHARED_LIB} /Y)
96+
COMMAND dumpbin /exports ${MKLDNN_INSTALL_DIR}/bin/mkldnn.dll > ${MKLDNN_INSTALL_DIR}/bin/exports.txt
97+
COMMAND echo LIBRARY mkldnn > ${MKLDNN_INSTALL_DIR}/bin/mkldnn.def
98+
COMMAND echo EXPORTS >> ${MKLDNN_INSTALL_DIR}/bin/mkldnn.def
99+
COMMAND echo off && (for /f "skip=19 tokens=4" %A in (${MKLDNN_INSTALL_DIR}/bin/exports.txt) do echo %A >> ${MKLDNN_INSTALL_DIR}/bin/mkldnn.def) && echo on
100+
COMMAND lib /def:${MKLDNN_INSTALL_DIR}/bin/mkldnn.def /out:${MKLDNN_LIB} /machine:x64
101+
COMMENT "Generate mkldnn.lib manually--->"
102+
DEPENDS ${MKLDNN_PROJECT}
103+
VERBATIM)
104+
ADD_CUSTOM_TARGET(mkldnn_cmd ALL DEPENDS ${MKLDNN_LIB})
117105
else(WIN32)
118106
SET(MKLDNN_SHARED_LIB ${MKLDNN_INSTALL_DIR}/libmkldnn.so.0)
119107
SET(MKLDNN_SHARED_LIB_1 ${MKLDNN_INSTALL_DIR}/libdnnl.so.1)
120108
SET(MKLDNN_SHARED_LIB_2 ${MKLDNN_INSTALL_DIR}/libdnnl.so.2)
121-
ADD_CUSTOM_COMMAND(TARGET ${MKLDNN_PROJECT} POST_BUILD
122-
COMMAND ${CMAKE_COMMAND} -E copy ${MKLDNN_LIB} ${MKLDNN_SHARED_LIB})
123-
ADD_CUSTOM_COMMAND(TARGET ${MKLDNN_PROJECT} POST_BUILD
124-
COMMAND ${CMAKE_COMMAND} -E copy ${MKLDNN_LIB} ${MKLDNN_SHARED_LIB_1})
125-
ADD_CUSTOM_COMMAND(TARGET ${MKLDNN_PROJECT} POST_BUILD
126-
COMMAND ${CMAKE_COMMAND} -E copy ${MKLDNN_LIB} ${MKLDNN_SHARED_LIB_2})
109+
ADD_CUSTOM_COMMAND(OUTPUT ${MKLDNN_SHARED_LIB_2}
110+
COMMAND ${CMAKE_COMMAND} -E copy ${MKLDNN_LIB} ${MKLDNN_SHARED_LIB}
111+
COMMAND ${CMAKE_COMMAND} -E copy ${MKLDNN_LIB} ${MKLDNN_SHARED_LIB_1}
112+
COMMAND ${CMAKE_COMMAND} -E copy ${MKLDNN_LIB} ${MKLDNN_SHARED_LIB_2}
113+
DEPENDS ${MKLDNN_PROJECT})
114+
ADD_CUSTOM_TARGET(mkldnn_cmd ALL DEPENDS ${MKLDNN_SHARED_LIB_2})
127115
endif(WIN32)
116+
117+
# generate a static dummy target to track mkldnn dependencies
118+
# for cc_library(xxx SRCS xxx.c DEPS mkldnn)
119+
generate_dummy_static_lib(LIB_NAME "mkldnn" GENERATOR "mkldnn.cmake")
120+
121+
TARGET_LINK_LIBRARIES(mkldnn ${MKLDNN_LIB} ${MKLML_IOMP_LIB})
122+
ADD_DEPENDENCIES(mkldnn ${MKLDNN_PROJECT} mkldnn_cmd)

cmake/external/protobuf.cmake

Lines changed: 10 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -198,16 +198,16 @@ FUNCTION(build_protobuf TARGET_NAME BUILD_FOR_HOST)
198198
"-Dprotobuf_MSVC_STATIC_RUNTIME=${MSVC_STATIC_CRT}")
199199
ENDIF()
200200

201-
if(WITH_ASCEND AND NOT WITH_ASCEND_CXX11)
202-
SET(PROTOBUF_REPOSITORY https://gitee.com/tianjianhe/protobuf.git)
203-
SET(PROTOBUF_TAG v3.8.0)
204-
elseif(WITH_ASCEND_CL AND NOT WITH_ASCEND_CXX11)
205-
SET(PROTOBUF_REPOSITORY https://gitee.com/tianjianhe/protobuf.git)
206-
SET(PROTOBUF_TAG v3.8.0)
207-
else()
208-
SET(PROTOBUF_REPOSITORY ${GIT_URL}/protocolbuffers/protobuf.git)
209-
SET(PROTOBUF_TAG 9f75c5aa851cd877fb0d93ccc31b8567a6706546)
210-
endif()
201+
if(WITH_ASCEND AND NOT WITH_ASCEND_CXX11)
202+
SET(PROTOBUF_REPOSITORY https://gitee.com/tianjianhe/protobuf.git)
203+
SET(PROTOBUF_TAG v3.8.0)
204+
elseif(WITH_ASCEND_CL AND NOT WITH_ASCEND_CXX11)
205+
SET(PROTOBUF_REPOSITORY https://gitee.com/tianjianhe/protobuf.git)
206+
SET(PROTOBUF_TAG v3.8.0)
207+
else()
208+
SET(PROTOBUF_REPOSITORY ${GIT_URL}/protocolbuffers/protobuf.git)
209+
SET(PROTOBUF_TAG 9f75c5aa851cd877fb0d93ccc31b8567a6706546)
210+
endif()
211211

212212
cache_third_party(${TARGET_NAME}
213213
REPOSITORY ${PROTOBUF_REPOSITORY}

cmake/external/pybind11.cmake

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -39,6 +39,7 @@ ExternalProject_Add(
3939
# to be modified without triggering incremental compilation, and the
4040
# third-party library version changes cannot be incorporated.
4141
# reference: https://cmake.org/cmake/help/latest/module/ExternalProject.html
42+
UPDATE_COMMAND ""
4243
CONFIGURE_COMMAND ""
4344
BUILD_COMMAND ""
4445
INSTALL_COMMAND ""

cmake/external/xpu.cmake

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -35,7 +35,7 @@ ELSE ()
3535
ENDIF()
3636

3737
SET(XPU_BASE_URL_WITHOUT_DATE "https://baidu-kunlun-product.cdn.bcebos.com/KL-SDK/klsdk-dev")
38-
SET(XPU_BASE_URL "${XPU_BASE_URL_WITHOUT_DATE}/20210729")
38+
SET(XPU_BASE_URL "${XPU_BASE_URL_WITHOUT_DATE}/20210804")
3939
SET(XPU_XRE_URL "${XPU_BASE_URL}/${XPU_XRE_DIR_NAME}.tar.gz" CACHE STRING "" FORCE)
4040
SET(XPU_XDNN_URL "${XPU_BASE_URL}/${XPU_XDNN_DIR_NAME}.tar.gz" CACHE STRING "" FORCE)
4141
SET(XPU_XCCL_URL "${XPU_BASE_URL_WITHOUT_DATE}/20210623/${XPU_XCCL_DIR_NAME}.tar.gz" CACHE STRING "" FORCE)

paddle/fluid/framework/ir/multi_devices_graph_pass/CMakeLists.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -18,4 +18,4 @@ cc_library(fuse_all_reduce_op_pass SRCS fuse_all_reduce_op_pass.cc DEPS graph gr
1818
cc_library(all_reduce_deps_pass SRCS all_reduce_deps_pass.cc DEPS all_reduce_op_handle graph graph_helper pass)
1919
cc_library(backward_optimizer_op_deps_pass SRCS backward_optimizer_op_deps_pass.cc DEPS graph graph_helper pass)
2020
cc_library(add_reader_dependency_pass SRCS add_reader_dependency_pass.cc DEPS graph graph_helper pass)
21-
cc_library(fix_op_run_order_pass SRCS fix_op_run_order_pass DEPS graph graph_helper multi_devices_helper pass op_handle_base eager_deletion_op_handle)
21+
cc_library(fix_op_run_order_pass SRCS fix_op_run_order_pass.cc DEPS graph graph_helper multi_devices_helper pass op_handle_base eager_deletion_op_handle)

paddle/fluid/framework/operator.cc

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1254,9 +1254,10 @@ void OperatorWithKernel::ChooseKernel(const RuntimeContext& ctx,
12541254
}
12551255
#endif
12561256
#ifdef PADDLE_WITH_XPU
1257-
if (kernel_iter == kernels.end() &&
1258-
is_xpu_place(expected_kernel_key.place_) &&
1259-
!paddle::platform::is_xpu_support_op(type_, expected_kernel_key)) {
1257+
if ((kernel_iter == kernels.end() &&
1258+
is_xpu_place(expected_kernel_key.place_) &&
1259+
!paddle::platform::is_xpu_support_op(type_, expected_kernel_key)) ||
1260+
paddle::platform::is_in_xpu_black_list(type_)) {
12601261
VLOG(3) << "missing XPU kernel: " << type_
12611262
<< ", expected_kernel_key:" << expected_kernel_key
12621263
<< ", fallbacking to CPU one!";

paddle/fluid/imperative/prepared_operator.cc

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -131,9 +131,10 @@ PreparedOp PrepareImpl(const NameVarMap<VarType>& ins,
131131
auto& kernels = kernels_iter->second;
132132
auto kernel_iter = kernels.find(expected_kernel_key);
133133
#ifdef PADDLE_WITH_XPU
134-
if (kernel_iter == kernels.end() &&
135-
is_xpu_place(expected_kernel_key.place_) &&
136-
!paddle::platform::is_xpu_support_op(op.Type(), expected_kernel_key)) {
134+
if ((kernel_iter == kernels.end() &&
135+
is_xpu_place(expected_kernel_key.place_) &&
136+
!paddle::platform::is_xpu_support_op(op.Type(), expected_kernel_key)) ||
137+
paddle::platform::is_in_xpu_black_list(op.Type())) {
137138
VLOG(3) << "missing XPU kernel: " << op.Type()
138139
<< ", expected_kernel_key:" << expected_kernel_key
139140
<< ", fallbacking to CPU one!";

0 commit comments

Comments
 (0)