From e119f240bd512b75e760e0ae8ca6fdc451b1790f Mon Sep 17 00:00:00 2001
From: youge325 <A372707325@126.com>
Date: Fri, 3 Oct 2025 19:46:10 +0800
Subject: [PATCH] =?UTF-8?q?=E3=80=90CUDA=20Kernel=20No.12=E3=80=91fused=5F?=
 =?UTF-8?q?stack=5Ftranspose=5Fquant=5Fkernel=E7=AE=97=E5=AD=90Kernel?=
 =?UTF-8?q?=E4=BF=AE=E5=A4=8D?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 .../gpu/fused_stack_transpose_quant_kernel.cu |  1 +
 .../gpu/fused_stack_transpose_quant_kernel.h  | 36 +++++++++++++++++++
 2 files changed, 37 insertions(+)
 create mode 100644 paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.h
diff --git a/paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.cu b/paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.cu
index 6afce7eac9a300..6b2fa29fb67c1d 100644
--- a/paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.cu
+++ b/paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.cu
@@ -12,6 +12,7 @@
 // See the License for the specific language governing permissions and
 // limitations under the License.
 
+#include "paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.h"
 #include "paddle/phi/backends/gpu/gpu_context.h"
 #include "paddle/phi/core/dense_tensor.h"
 #include "paddle/phi/core/kernel_registry.h"
diff --git a/paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.h b/paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.h
new file mode 100644
index 00000000000000..0dd685305c74a7
--- /dev/null
+++ b/paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.h
@@ -0,0 +1,36 @@
+// Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#pragma once
+
+#include <vector>
+#include "paddle/phi/core/dense_tensor.h"
+
+namespace phi {
+namespace fusion {  // declarations only; no function bodies in this header
+
+template <typename T, typename Context>  // T: presumably the element dtype
+void FusedStackQuantKernel(const Context& dev_ctx,
+                           const std::vector<const DenseTensor*>& x,
+                           DenseTensor* out,     // non-const; likely an output
+                           DenseTensor* scale);  // non-const; likely an output
+
+template <typename T, typename Context>  // same parameter list as above
+void FusedStackTransposeQuantKernel(const Context& dev_ctx,
+                                    const std::vector<const DenseTensor*>& x,
+                                    DenseTensor* out,     // likely an output
+                                    DenseTensor* scale);  // likely an output
+
+}  // namespace fusion
+}  // namespace phi