 #include "kernel_operator.h"
 
-#include <cmath>
-
 using namespace AscendC;
 
 #define BUFFER_NUM 2
@@ -183,7 +181,7 @@ extern "C" __global__ __aicore__ void ascendc_dup_by_rows_fp32(
     copy_to_ub(output_ne_gm, output_ne_ub, 32);
     copy_to_ub(output_nb_gm, output_nb_ub, 32);
 
-    DupByRows<float_t, float_t> op;
+    DupByRows<float, float> op;
     op.init(src_gm, dst_gm, input_ne_ub, input_nb_ub);
     op.dup();
 }
@@ -206,7 +204,7 @@ extern "C" __global__ __aicore__ void ascendc_dup_by_rows_fp32_to_fp16(
     copy_to_ub(output_ne_gm, output_ne_ub, 32);
     copy_to_ub(output_nb_gm, output_nb_ub, 32);
 
-    DupByRows<float_t, half> op;
+    DupByRows<float, half> op;
     op.init(src_gm, dst_gm, input_ne_ub, input_nb_ub);
     op.dup_with_cast();
 }
@@ -230,7 +228,7 @@ extern "C" __global__ __aicore__ void ascendc_dup_by_rows_fp16_to_fp32(
     copy_to_ub(output_ne_gm, output_ne_ub, 32);
     copy_to_ub(output_nb_gm, output_nb_ub, 32);
 
-    DupByRows<half, float_t> op;
+    DupByRows<half, float> op;
     op.init(src_gm, dst_gm, input_ne_ub, input_nb_ub);
     op.dup_with_cast();
 }
0 commit comments