From 6697eadca3db3efc12f78d027408772130fe1945 Mon Sep 17 00:00:00 2001 From: Yami <156195357+Le-soleile@users.noreply.github.com> Date: Fri, 26 Sep 2025 18:12:34 +0800 Subject: [PATCH 1/8] Update distributed_fused_lamb_init_kernel_register.cu MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 替换引用的.cu文件 --- .../cuda_kernels/distributed_fused_lamb_init_kernel_register.cu | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/backends/metax_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu b/backends/metax_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu index 9d4d57e9e5d..df1b1cc7335 100644 --- a/backends/metax_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu +++ b/backends/metax_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu @@ -16,7 +16,7 @@ #include "paddle/phi/kernels/distributed_fused_lamb_init_kernel.h" #include "paddle/phi/kernels/funcs/algorithm.h" #include "paddle/phi/kernels/fusion/gpu/cast_with_ptr.h" -#include "paddle/phi/kernels/fusion/gpu/distributed_fused_lamb_init_kernel.cu" //NOLINT +#include "paddle/phi/kernels/distributed_fused_lamb_init_kernel.h" PD_CUSTOM_KERNEL_REGISTER(distributed_fused_lamb_init, metax_gpu, From 91b1de23e33abde4c2d45b45c3517534902933c1 Mon Sep 17 00:00:00 2001 From: Yami <156195357+Le-soleile@users.noreply.github.com> Date: Fri, 26 Sep 2025 18:13:06 +0800 Subject: [PATCH 2/8] Update distributed_fused_lamb_init_kernel_register.cu MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 替换引用的.cu文件 --- .../cuda_kernels/distributed_fused_lamb_init_kernel_register.cu | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu index 49e4eb84ad8..f6f3402b647 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu @@ -16,7 +16,7 @@ #include "paddle/phi/kernels/distributed_fused_lamb_init_kernel.h" #include "paddle/phi/kernels/funcs/algorithm.h" #include "paddle/phi/kernels/fusion/gpu/cast_with_ptr.h" -#include "paddle/phi/kernels/fusion/gpu/distributed_fused_lamb_init_kernel.cu" //NOLINT +#include "paddle/phi/kernels/distributed_fused_lamb_init_kernel.h" PD_CUSTOM_KERNEL_REGISTER(distributed_fused_lamb_init, iluvatar_gpu, From 6b41c648a59c5423aa2690e0a42ba94276e0c3f0 Mon Sep 17 00:00:00 2001 From: Yami <156195357+Le-soleile@users.noreply.github.com> Date: Fri, 26 Sep 2025 18:19:18 +0800 Subject: [PATCH 3/8] Update fused_bias_act_kernel_register.cu MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 替换引用的.cu文件 --- .../kernels/ernie_core/fused_bias_act_kernel_register.cu | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/backends/metax_gpu/kernels/ernie_core/fused_bias_act_kernel_register.cu b/backends/metax_gpu/kernels/ernie_core/fused_bias_act_kernel_register.cu index 9345cb0a291..35af5740a59 100644 --- a/backends/metax_gpu/kernels/ernie_core/fused_bias_act_kernel_register.cu +++ b/backends/metax_gpu/kernels/ernie_core/fused_bias_act_kernel_register.cu @@ -14,7 +14,7 @@ // limitations under the License. #include "paddle/phi/core/kernel_registry.h" -#include "paddle/phi/kernels/fusion/gpu/fused_bias_act_kernel.cu" //NOLINT +#include "paddle/phi/kernels/fusion/gpu/fused_bias_act_utils.h" PD_CUSTOM_KERNEL_REGISTER(fused_bias_act, metax_gpu, From d7fffd0aa3b276cf3dfbaf7971bd572af4c88965 Mon Sep 17 00:00:00 2001 From: Yami <156195357+Le-soleile@users.noreply.github.com> Date: Fri, 26 Sep 2025 18:19:40 +0800 Subject: [PATCH 4/8] Update fused_bias_act_kernel_register.cc MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 替换引用的.cu文件 --- .../kernels/ernie_core/fused_bias_act_kernel_register.cc | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/backends/iluvatar_gpu/kernels/ernie_core/fused_bias_act_kernel_register.cc b/backends/iluvatar_gpu/kernels/ernie_core/fused_bias_act_kernel_register.cc index b7920534ed1..a08c4fb956e 100644 --- a/backends/iluvatar_gpu/kernels/ernie_core/fused_bias_act_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/ernie_core/fused_bias_act_kernel_register.cc @@ -13,7 +13,7 @@ // limitations under the License. #include "paddle/phi/core/kernel_registry.h" -#include "paddle/phi/kernels/fusion/gpu/fused_bias_act_kernel.cu" //NOLINT +#include "paddle/phi/kernels/fusion/gpu/fused_bias_act_utils.h" PD_CUSTOM_KERNEL_REGISTER(fused_bias_act, iluvatar_gpu, From 59b57c2a72cc46165164003ec6c08ccfe894110d Mon Sep 17 00:00:00 2001 From: Le-soleile <3516093767@qq.com> Date: Sun, 28 Sep 2025 05:51:46 +0000 Subject: [PATCH 5/8] Style --- .../distributed_fused_lamb_init_kernel_register.cu | 14 ++++++++------ .../distributed_fused_lamb_init_kernel_register.cu | 1 - 2 files changed, 8 insertions(+), 7 deletions(-) diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu index f6f3402b647..42c52c94c9a 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu @@ -16,13 +16,15 @@ #include "paddle/phi/kernels/distributed_fused_lamb_init_kernel.h" #include "paddle/phi/kernels/funcs/algorithm.h" #include "paddle/phi/kernels/fusion/gpu/cast_with_ptr.h" -#include "paddle/phi/kernels/distributed_fused_lamb_init_kernel.h" -PD_CUSTOM_KERNEL_REGISTER(distributed_fused_lamb_init, - iluvatar_gpu, - ALL_LAYOUT, - phi::fusion::DistributedFusedLambInitOpKernel, - float) { +backends / iluvatar_gpu / kernels / ernie_core / + fused_bias_act_kernel_register.cc + + PD_CUSTOM_KERNEL_REGISTER(distributed_fused_lamb_init, + iluvatar_gpu, + ALL_LAYOUT, + phi::fusion::DistributedFusedLambInitOpKernel, + float) { kernel->OutputAt(0).SetDataType(phi::DataType::FLOAT32); kernel->OutputAt(1).SetDataType(phi::DataType::FLOAT32); kernel->OutputAt(2).SetDataType(phi::DataType::FLOAT16); diff --git a/backends/metax_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu b/backends/metax_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu index df1b1cc7335..97ad0c25596 100644 --- a/backends/metax_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu +++ b/backends/metax_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu @@ -16,7 +16,6 @@ #include "paddle/phi/kernels/distributed_fused_lamb_init_kernel.h" #include "paddle/phi/kernels/funcs/algorithm.h" #include "paddle/phi/kernels/fusion/gpu/cast_with_ptr.h" -#include "paddle/phi/kernels/distributed_fused_lamb_init_kernel.h" PD_CUSTOM_KERNEL_REGISTER(distributed_fused_lamb_init, metax_gpu, From fbc160c080ef286fa220ceac9cdaa3bde292f694 Mon Sep 17 00:00:00 2001 From: Le-soleile <3516093767@qq.com> Date: Sun, 28 Sep 2025 06:43:54 +0000 Subject: [PATCH 6/8] change #include --- .../distributed_fused_lamb_init_kernel_register.cu | 13 +++++-------- 1 file changed, 5 insertions(+), 8 deletions(-) diff --git a/backends/iluvatar_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu b/backends/iluvatar_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu index 42c52c94c9a..13516a5e0c9 100644 --- a/backends/iluvatar_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu +++ b/backends/iluvatar_gpu/kernels/cuda_kernels/distributed_fused_lamb_init_kernel_register.cu @@ -17,14 +17,11 @@ #include "paddle/phi/kernels/funcs/algorithm.h" #include "paddle/phi/kernels/fusion/gpu/cast_with_ptr.h" -backends / iluvatar_gpu / kernels / ernie_core / - fused_bias_act_kernel_register.cc - - PD_CUSTOM_KERNEL_REGISTER(distributed_fused_lamb_init, - iluvatar_gpu, - ALL_LAYOUT, - phi::fusion::DistributedFusedLambInitOpKernel, - float) { +PD_CUSTOM_KERNEL_REGISTER(distributed_fused_lamb_init, + iluvatar_gpu, + ALL_LAYOUT, + phi::fusion::DistributedFusedLambInitOpKernel, + float) { kernel->OutputAt(0).SetDataType(phi::DataType::FLOAT32); kernel->OutputAt(1).SetDataType(phi::DataType::FLOAT32); kernel->OutputAt(2).SetDataType(phi::DataType::FLOAT16); From 087292cae189e71b761f8e1ad0b40dbb8d8fff6b Mon Sep 17 00:00:00 2001 From: Yami <156195357+Le-soleile@users.noreply.github.com> Date: Mon, 29 Sep 2025 16:18:08 +0800 Subject: [PATCH 7/8] Update fused_bias_act_kernel_register.cu MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 替换错误的引用 --- .../kernels/ernie_core/fused_bias_act_kernel_register.cu | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/backends/metax_gpu/kernels/ernie_core/fused_bias_act_kernel_register.cu b/backends/metax_gpu/kernels/ernie_core/fused_bias_act_kernel_register.cu index 35af5740a59..c49ceed2196 100644 --- a/backends/metax_gpu/kernels/ernie_core/fused_bias_act_kernel_register.cu +++ b/backends/metax_gpu/kernels/ernie_core/fused_bias_act_kernel_register.cu @@ -14,7 +14,7 @@ // limitations under the License. #include "paddle/phi/core/kernel_registry.h" -#include "paddle/phi/kernels/fusion/gpu/fused_bias_act_utils.h" +#include "paddle/phi/kernels/fused_bias_act_kernel.h" PD_CUSTOM_KERNEL_REGISTER(fused_bias_act, metax_gpu, From b64b9ddc299128d9077afe4692b965986cd8bbbb Mon Sep 17 00:00:00 2001 From: Yami <156195357+Le-soleile@users.noreply.github.com> Date: Mon, 29 Sep 2025 16:18:52 +0800 Subject: [PATCH 8/8] Update fused_bias_act_kernel_register.cc MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 替换错误的引用 --- .../kernels/ernie_core/fused_bias_act_kernel_register.cc | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/backends/iluvatar_gpu/kernels/ernie_core/fused_bias_act_kernel_register.cc b/backends/iluvatar_gpu/kernels/ernie_core/fused_bias_act_kernel_register.cc index a08c4fb956e..24c7d3e1711 100644 --- a/backends/iluvatar_gpu/kernels/ernie_core/fused_bias_act_kernel_register.cc +++ b/backends/iluvatar_gpu/kernels/ernie_core/fused_bias_act_kernel_register.cc @@ -13,7 +13,7 @@ // limitations under the License. #include "paddle/phi/core/kernel_registry.h" -#include "paddle/phi/kernels/fusion/gpu/fused_bias_act_utils.h" +#include "paddle/phi/kernels/fused_bias_act_kernel.h" PD_CUSTOM_KERNEL_REGISTER(fused_bias_act, iluvatar_gpu,