Skip to content

Commit 34403fa

Browse files
Le-soleile, luotao1, and YqGe585
authored
【CUDA Kernel No.81、88、89、91、92】算子Kernel修复 (#2192)
* fix
* 修改路径错误

---------

Co-authored-by: Tao Luo <[email protected]>
Co-authored-by: Yuqiang Ge <[email protected]>
1 parent a62d30b commit 34403fa

11 files changed

+15
-10
lines changed

backends/iluvatar_gpu/kernels/cuda_kernels/moe_unpermute_kernel_register.cu

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@
1515
#include "paddle/phi/core/kernel_registry.h"
1616
#include "paddle/phi/kernels/full_kernel.h"
1717
#include "paddle/phi/kernels/gpu/moe_permute_utils.h"
18-
#include "paddle/phi/kernels/gpu/moe_unpermute_kernel.cu" //NOLINT
18+
#include "paddle/phi/kernels/gpu/moe_unpermute_kernel.h"
1919

2020
PD_CUSTOM_KERNEL_REGISTER(moe_unpermute,
2121
iluvatar_gpu,

backends/iluvatar_gpu/kernels/cuda_kernels/partial_allgather_kernel_register.cu

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,7 @@
1212
// See the License for the specific language governing permissions and
1313
// limitations under the License.
1414
#include "paddle/phi/core/kernel_registry.h"
15-
#include "paddle/phi/kernels/gpu/partial_allgather_kernel.cu" //NOLINT
15+
#include "paddle/phi/kernels/gpu/partial_allgather_kernel.h"
1616
#include "paddle/phi/kernels/partial_concat_kernel.h"
1717

1818
#if (NCCL_VERSION_CODE >= 21000 && CUDA_VERSION >= 11000) || \

backends/iluvatar_gpu/kernels/cuda_kernels/partial_concat_grad_kernel_register.cu

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@
1313
// limitations under the License.
1414

1515
#include "paddle/phi/core/kernel_registry.h"
16-
#include "paddle/phi/kernels/gpu/partial_concat_grad_kernel.cu" //NOLINT
16+
#include "paddle/phi/kernels/gpu/partial_concat_grad_kernel.h"
1717
PD_CUSTOM_KERNEL_REGISTER(partial_concat_grad,
1818
iluvatar_gpu,
1919
ALL_LAYOUT,

backends/iluvatar_gpu/kernels/cuda_kernels/partial_recv_kernel_register.cu

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@
1313
// limitations under the License.
1414

1515
#include "paddle/phi/core/kernel_registry.h"
16-
#include "paddle/phi/kernels/gpu/partial_recv_kernel.cu" //NOLINT
16+
#include "paddle/phi/kernels/partial_recv_kernel.h"
1717
#if (NCCL_VERSION_CODE >= 21000 && CUDA_VERSION >= 11000) || \
1818
defined(PADDLE_WITH_HIP)
1919
PD_CUSTOM_KERNEL_REGISTER(partial_recv,

backends/iluvatar_gpu/kernels/cuda_kernels/partial_send_kernel_register.cu

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@
1313
// limitations under the License.
1414

1515
#include "paddle/phi/core/kernel_registry.h"
16-
#include "paddle/phi/kernels/gpu/partial_send_kernel.cu" //NOLINT
16+
#include "paddle/phi/kernels/gpu/partial_send_kernel.h"
1717
#if (NCCL_VERSION_CODE >= 21000 && CUDA_VERSION >= 11000) || \
1818
defined(PADDLE_WITH_HIP)
1919
PD_CUSTOM_KERNEL_REGISTER(partial_send,

backends/metax_gpu/CMakeLists.txt

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -124,6 +124,11 @@ file(
124124
${PADDLE_SOURCE_DIR}/paddle/phi/kernels/funcs/math/*.cu
125125
${PADDLE_SOURCE_DIR}/paddle/phi/kernels/funcs/eigen/*.cu
126126
# kernels/gpu
127+
${PADDLE_SOURCE_DIR}/paddle/phi/kernels/gpu/partial_send_kernel.cu
128+
${PADDLE_SOURCE_DIR}/paddle/phi/kernels/gpu/partial_recv_kernel.cu
129+
${PADDLE_SOURCE_DIR}/paddle/phi/kernels/gpu/partial_concat_grad_kernel.cu
130+
${PADDLE_SOURCE_DIR}/paddle/phi/kernels/gpu/partial_allgather_kernel.cu
131+
${PADDLE_SOURCE_DIR}/paddle/phi/kernels/gpu/ctc_align_kernel.cu
127132
${PADDLE_SOURCE_DIR}/paddle/phi/kernels/gpu/yolo_box_head_kernel.cu
128133
${PADDLE_SOURCE_DIR}/paddle/phi/kernels/gpu/stft_grad_kernel.cu
129134
${PADDLE_SOURCE_DIR}/paddle/phi/kernels/gpu/soft_relu_grad_kernel.cu

backends/metax_gpu/kernels/cuda_kernels/moe_unpermute_kernel_register.cu

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@
1515
#include "paddle/phi/core/kernel_registry.h"
1616
#include "paddle/phi/kernels/full_kernel.h"
1717
#include "paddle/phi/kernels/gpu/moe_permute_utils.h"
18-
#include "paddle/phi/kernels/gpu/moe_unpermute_kernel.cu" //NOLINT
18+
#include "paddle/phi/kernels/gpu/moe_unpermute_kernel.h"
1919

2020
PD_CUSTOM_KERNEL_REGISTER(moe_unpermute,
2121
metax_gpu,

backends/metax_gpu/kernels/cuda_kernels/partial_allgather_kernel_register.cu

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,7 @@
1212
// See the License for the specific language governing permissions and
1313
// limitations under the License.
1414
#include "paddle/phi/core/kernel_registry.h"
15-
#include "paddle/phi/kernels/gpu/partial_allgather_kernel.cu" //NOLINT
15+
#include "paddle/phi/kernels/gpu/partial_allgather_kernel.h"
1616
#include "paddle/phi/kernels/partial_concat_kernel.h"
1717

1818
#if (NCCL_VERSION_CODE >= 21000 && CUDA_VERSION >= 11000) || \

backends/metax_gpu/kernels/cuda_kernels/partial_concat_grad_kernel_register.cu

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@
1313
// limitations under the License.
1414

1515
#include "paddle/phi/core/kernel_registry.h"
16-
#include "paddle/phi/kernels/gpu/partial_concat_grad_kernel.cu" //NOLINT
16+
#include "paddle/phi/kernels/gpu/partial_concat_grad_kernel.h"
1717
PD_CUSTOM_KERNEL_REGISTER(partial_concat_grad,
1818
metax_gpu,
1919
ALL_LAYOUT,

backends/metax_gpu/kernels/cuda_kernels/partial_recv_kernel_register.cu

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@
1313
// limitations under the License.
1414

1515
#include "paddle/phi/core/kernel_registry.h"
16-
#include "paddle/phi/kernels/gpu/partial_recv_kernel.cu" //NOLINT
16+
#include "paddle/phi/kernels/partial_recv_kernel.h"
1717
#if (NCCL_VERSION_CODE >= 21000 && CUDA_VERSION >= 11000) || \
1818
defined(PADDLE_WITH_HIP)
1919
PD_CUSTOM_KERNEL_REGISTER(partial_recv,

0 commit comments

Comments
 (0)