From fcd8bcbdf55713b2373876efc2338873c1e3e043 Mon Sep 17 00:00:00 2001 From: wangjiabao <204268140@qq.com> Date: Sat, 27 Sep 2025 16:56:21 +0800 Subject: [PATCH 1/3] =?UTF-8?q?=E3=80=90CUDA=20Kernel=20No.8=E3=80=91fused?= =?UTF-8?q?=5Fseqpool=5Fcvm=E7=AE=97=E5=AD=90Kernel=E4=BF=AE=E5=A4=8D?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .../kernels/cuda_kernels/fused_seqpool_cvm_kernel_register.cu | 2 +- .../kernels/fusion/fused_seqpool_cvm_kernel_register.cu | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_seqpool_cvm_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_seqpool_cvm_kernel_register.cu index 040aadaddbd..88c3ad47461 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_seqpool_cvm_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_seqpool_cvm_kernel_register.cu @@ -14,7 +14,7 @@ #include "paddle/phi/core/kernel_registry.h" #include "paddle/phi/core/mixed_vector.h" -#include "paddle/phi/kernels/fusion/gpu/fused_seqpool_cvm_kernel.cu" //NOLINT +#include "paddle/phi/kernels/fused_seqpool_cvm_kernel.h" PD_CUSTOM_KERNEL_REGISTER(fused_seqpool_cvm, iluvatar_gpu, diff --git a/backends/metax_gpu/kernels/fusion/fused_seqpool_cvm_kernel_register.cu b/backends/metax_gpu/kernels/fusion/fused_seqpool_cvm_kernel_register.cu index 2505a742a06..5b552b6298d 100644 --- a/backends/metax_gpu/kernels/fusion/fused_seqpool_cvm_kernel_register.cu +++ b/backends/metax_gpu/kernels/fusion/fused_seqpool_cvm_kernel_register.cu @@ -14,7 +14,7 @@ #include "paddle/phi/core/kernel_registry.h" #include "paddle/phi/core/mixed_vector.h" -#include "paddle/phi/kernels/fusion/gpu/fused_seqpool_cvm_kernel.cu" //NOLINT +#include "paddle/phi/kernels/fused_seqpool_cvm_kernel.h" PD_CUSTOM_KERNEL_REGISTER(fused_seqpool_cvm, metax_gpu, From 9af8449f711e9d22663531dbd119c3f15eb7fab9 Mon Sep 17 00:00:00 2001 From: wangjiabao <204268140@qq.com> Date: Sat, 27 Sep 2025 16:59:56 +0800 Subject: [PATCH 2/3] =?UTF-8?q?=E3=80=90CUDA=20Kernel=20No.9=E3=80=91fused?= =?UTF-8?q?=5Fsoftmax=5Fmask=5Fgrad=E7=AE=97=E5=AD=90Kernel=E4=BF=AE?= =?UTF-8?q?=E5=A4=8D?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .../cuda_kernels/fused_softmax_mask_grad_kernel_register.cu | 2 +- .../kernels/fusion/fused_softmax_mask_grad_kernel_register.cu | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_softmax_mask_grad_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_softmax_mask_grad_kernel_register.cu index 0bb64afd52e..800a8c3f23d 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_softmax_mask_grad_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_softmax_mask_grad_kernel_register.cu @@ -14,7 +14,7 @@ #include "paddle/phi/core/kernel_registry.h" #include "paddle/phi/kernels/full_kernel.h" -#include "paddle/phi/kernels/fusion/gpu/fused_softmax_mask_grad_kernel.cu" // NOLINT +#include "paddle/phi/kernels/fused_softmax_mask_grad_kernel.h" #include "paddle/phi/kernels/fusion/gpu/fused_softmax_mask_utils.h" PD_CUSTOM_KERNEL_REGISTER(fused_softmax_mask_grad, diff --git a/backends/metax_gpu/kernels/fusion/fused_softmax_mask_grad_kernel_register.cu b/backends/metax_gpu/kernels/fusion/fused_softmax_mask_grad_kernel_register.cu index 55883496a72..2c596c6a4eb 100644 --- a/backends/metax_gpu/kernels/fusion/fused_softmax_mask_grad_kernel_register.cu +++ b/backends/metax_gpu/kernels/fusion/fused_softmax_mask_grad_kernel_register.cu @@ -14,7 +14,7 @@ #include "paddle/phi/core/kernel_registry.h" #include "paddle/phi/kernels/full_kernel.h" -#include "paddle/phi/kernels/fusion/gpu/fused_softmax_mask_grad_kernel.cu" // NOLINT +#include "paddle/phi/kernels/fused_softmax_mask_grad_kernel.h" #include "paddle/phi/kernels/fusion/gpu/fused_softmax_mask_utils.h" PD_CUSTOM_KERNEL_REGISTER(fused_softmax_mask_grad, From 60b87612e884da843b293c47cb0b1b8ae078dc12 Mon Sep 17 00:00:00 2001 From: wangjiabao <204268140@qq.com> Date: Sat, 27 Sep 2025 20:05:35 +0800 Subject: [PATCH 3/3] =?UTF-8?q?=E3=80=90CUDA=20Kernel=20No.9=E3=80=91fused?= =?UTF-8?q?=5Fsoftmax=5Fmask=5Fgrad=E7=AE=97=E5=AD=90Kernel=E4=BF=AE?= =?UTF-8?q?=E5=A4=8D?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .../kernels/cuda_kernels/fused_seqpool_cvm_kernel_register.cu | 2 +- .../kernels/fusion/fused_seqpool_cvm_kernel_register.cu | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_seqpool_cvm_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_seqpool_cvm_kernel_register.cu index 88c3ad47461..040aadaddbd 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/fused_seqpool_cvm_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/fused_seqpool_cvm_kernel_register.cu @@ -14,7 +14,7 @@ #include "paddle/phi/core/kernel_registry.h" #include "paddle/phi/core/mixed_vector.h" -#include "paddle/phi/kernels/fused_seqpool_cvm_kernel.h" +#include "paddle/phi/kernels/fusion/gpu/fused_seqpool_cvm_kernel.cu" //NOLINT PD_CUSTOM_KERNEL_REGISTER(fused_seqpool_cvm, iluvatar_gpu, diff --git a/backends/metax_gpu/kernels/fusion/fused_seqpool_cvm_kernel_register.cu b/backends/metax_gpu/kernels/fusion/fused_seqpool_cvm_kernel_register.cu index 5b552b6298d..2505a742a06 100644 --- a/backends/metax_gpu/kernels/fusion/fused_seqpool_cvm_kernel_register.cu +++ b/backends/metax_gpu/kernels/fusion/fused_seqpool_cvm_kernel_register.cu @@ -14,7 +14,7 @@ #include "paddle/phi/core/kernel_registry.h" #include "paddle/phi/core/mixed_vector.h" -#include "paddle/phi/kernels/fused_seqpool_cvm_kernel.h" +#include "paddle/phi/kernels/fusion/gpu/fused_seqpool_cvm_kernel.cu" //NOLINT PD_CUSTOM_KERNEL_REGISTER(fused_seqpool_cvm, metax_gpu,