From e119f240bd512b75e760e0ae8ca6fdc451b1790f Mon Sep 17 00:00:00 2001
From: youge325
Date: Fri, 3 Oct 2025 19:46:10 +0800
Subject: [PATCH] =?UTF-8?q?=E3=80=90CUDA=20Kernel=20No.12=E3=80=91fused=5F?=
 =?UTF-8?q?stack=5Ftranspose=5Fquant=5Fkernel=E7=AE=97=E5=AD=90Kernel?=
 =?UTF-8?q?=E4=BF=AE=E5=A4=8D?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
NOTE(review): free-text area; it is not part of the diff payload.
  * This patch adds a header that declares FusedStackQuantKernel and
    FusedStackTransposeQuantKernel in namespace phi::fusion, and makes the
    existing .cu file include that header. Only declarations are added.
  * The reviewed copy had lost every angle-bracket span. Restored here:
    "#include <vector>", "template <typename T, typename Context>" and
    "std::vector<const DenseTensor*>". The names "T" and "const DenseTensor*"
    are assumed from the usual PHI kernel signature -- TODO confirm against
    the definitions in fused_stack_transpose_quant_kernel.cu.
  * The "From:" header carries no mail address in the reviewed copy; it was
    not reconstructed -- restore it from the original commit before applying.

 .../gpu/fused_stack_transpose_quant_kernel.cu |  1 +
 .../gpu/fused_stack_transpose_quant_kernel.h  | 36 +++++++++++++++++++
 2 files changed, 37 insertions(+)
 create mode 100644 paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.h

diff --git a/paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.cu b/paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.cu
index 6afce7eac9a300..6b2fa29fb67c1d 100644
--- a/paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.cu
+++ b/paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.cu
@@ -12,6 +12,7 @@
 // See the License for the specific language governing permissions and
 // limitations under the License.
 
+#include "paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.h"
 #include "paddle/phi/backends/gpu/gpu_context.h"
 #include "paddle/phi/core/dense_tensor.h"
 #include "paddle/phi/core/kernel_registry.h"
diff --git a/paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.h b/paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.h
new file mode 100644
index 00000000000000..0dd685305c74a7
--- /dev/null
+++ b/paddle/phi/kernels/fusion/gpu/fused_stack_transpose_quant_kernel.h
@@ -0,0 +1,36 @@
+// Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#pragma once
+
+#include <vector>
+#include "paddle/phi/core/dense_tensor.h"
+
+namespace phi {
+namespace fusion {
+
+template <typename T, typename Context>
+void FusedStackQuantKernel(const Context& dev_ctx,
+                           const std::vector<const DenseTensor*>& x,
+                           DenseTensor* out,
+                           DenseTensor* scale);
+
+template <typename T, typename Context>
+void FusedStackTransposeQuantKernel(const Context& dev_ctx,
+                                    const std::vector<const DenseTensor*>& x,
+                                    DenseTensor* out,
+                                    DenseTensor* scale);
+
+}  // namespace fusion
+}  // namespace phi