@@ -111,6 +111,7 @@ file(
111
111
${PADDLE_SOURCE_DIR} /paddle/phi/backends/gpu/cuda/cuda_graph.cc
112
112
# Core
113
113
${PADDLE_SOURCE_DIR} /paddle/phi/core/enforce.cc
114
+ ${PADDLE_SOURCE_DIR} /paddle/phi/core/mixed_vector.cc
114
115
${PADDLE_SOURCE_DIR} /paddle/phi/backends/dynload/cusparse.cc
115
116
# kernels/Funcs
116
117
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/funcs/*.cu
@@ -163,13 +164,11 @@ file(
163
164
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/diag_grad_kernel.cu
164
165
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/einsum_kernel.cu
165
166
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/einsum_grad_kernel.cu
166
- ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/elementwise_grad_kernel.cu
167
167
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/decode_jpeg_kernel.cu
168
168
${PADDLE_SOURCE_DIR} /paddle/phi/backends/dynload/nvjpeg.cc
169
169
${PADDLE_SOURCE_DIR} /paddle/phi/backends/dynload/cupti.cc
170
170
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/embedding_kernel.cu
171
171
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/embedding_grad_kernel.cu
172
- ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/embedding_with_scaled_gradient_grad_kernel_register.cu
173
172
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/expand_kernel.cu
174
173
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/expand_grad_kernel.cu
175
174
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/expand_as_grad_kernel.cu
@@ -239,6 +238,8 @@ file(
239
238
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/where_grad_kernel.cu
240
239
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/where_kernel.cu
241
240
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/empty_kernel.cc
241
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/lerp_grad_kernel.cu
242
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/lerp_kernel.cu
242
243
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/flatten_kernel.cc
243
244
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/flatten_grad_kernel.cc
244
245
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/reduce_all_kernel.cc
@@ -406,7 +407,6 @@ file(
406
407
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/radam_kernel.cu
407
408
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/random_routing_kernel.cu
408
409
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/renorm_grad_kernel.cu
409
- ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/rmsprop_kernel.cu
410
410
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/scale_kernel.cu
411
411
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/randperm_kernel.cu
412
412
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/reduce_as_grad_kernel.cu
@@ -461,8 +461,10 @@ file(
461
461
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/unfold_kernel.cu
462
462
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/unfold_grad_kernel.cu
463
463
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/unpool_kernel.cu
464
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/lstsq_kernel.cu
464
465
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/unpool_grad_kernel.cu
465
466
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/unstack_grad_kernel_register.cu
467
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/stack_grad_kernel.cu
466
468
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/unstack_kernel.cu
467
469
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/viterbi_decode_kernel.cu
468
470
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/warprnnt_grad_kernel.cu
@@ -473,6 +475,7 @@ file(
473
475
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/gammaincc_kernel.cu
474
476
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/gammaincc_grad_kernel.cu
475
477
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/llm_int8_linear_kernel.cu
478
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/baddbmm_kernel.cu
476
479
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/baddbmm_grad_kernel.cu
477
480
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/load_kernel.cu
478
481
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/load_combine_kernel.cu
@@ -481,6 +484,13 @@ file(
481
484
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/save_kernel.cu
482
485
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/dropout_kernel.cu
483
486
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/dropout_grad_kernel.cu
487
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/index_add_grad_kernel.cu
488
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/bce_loss_kernel.cu
489
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/bce_loss_grad_kernel.cu
490
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/meshgrid_kernel.cu.cc
491
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/meshgrid_grad_kernel.cu.cc
492
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/pad3d_grad_kernel.cu
493
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/pad3d_kernel.cu
484
494
# ############################################################################
485
495
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/array_grad_kernel.cc
486
496
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/set_kernel.cc
@@ -547,6 +557,7 @@ file(
547
557
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/sparse/gpu/sync_batch_norm_kernel.cu
548
558
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/sparse/gpu/unary_grad_kernel.cu
549
559
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/sparse/gpu/sum_grad_kernel.cu
560
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/transfer_layout_kernel.cc
550
561
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/sparse/gpu/elementwise_grad_kernel.cu
551
562
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/sparse/gpu/mask_kernel.cu
552
563
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/legacy/gpu/ext_build_src_rank_and_local_expert_id_kernel.cu
@@ -595,8 +606,39 @@ file(
595
606
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/fusion/gpu/fused_swiglu_weighted_bwd_kernel.cu
596
607
${PADDLE_SOURCE_DIR} /paddle/phi/core/flags.cc
597
608
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/funcs/math_function.cc
609
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/log_softmax_kernel.cu
610
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/log_softmax_grad_kernel.cu
598
611
# ${PADDLE_SOURCE_DIR}/paddle/phi/backends/context_pool.cc
599
612
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/funcs/repeat_tensor2index_tensor.cu
613
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/binomial_kernel.cu
614
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/bernoulli_kernel.cu
615
+ # ${PADDLE_SOURCE_DIR}/paddle/phi/kernels/gpu/bmm_grad_kernel_impl.h
616
+ # ${PADDLE_SOURCE_DIR}/paddle/phi/kernels/gpu/bmm_kernel.cu
617
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/box_coder_kernel.cu
618
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/broadcast_tensors_kernel.cu
619
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/broadcast_tensors_grad_kernel.cu
620
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/channel_shuffle_grad_kernel.cu
621
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/channel_shuffle_kernel.cu
622
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/complex_grad_kernel.cu
623
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/complex_kernel.cu
624
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/cum_maxmin_grad_kernel.cu
625
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/cum_maxmin_kernel.cu
626
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/digamma_kernel.cu
627
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/digamma_grad_kernel.cu
628
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/dot_kernel.cu
629
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/dot_grad_kernel.cu
630
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/eigh_grad_kernel.cu
631
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/eigvalsh_grad_kernel.cu
632
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/exponential_kernel.cu
633
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/flip_kernel.cu
634
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/gammaincc_grad_kernel.cu
635
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/gather_tree_kernel.cu
636
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/graph_reindex_kernel.cu
637
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/graph_sample_neighbors_kernel.cu
638
+ # ${PADDLE_SOURCE_DIR}/paddle/phi/kernels/gpu/group_norm_kernel.cu
639
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/group_norm_grad_kernel.cu
640
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/gumbel_softmax_grad_kernel.cu
641
+ ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/gpu/gumbel_softmax_kernel.cu
600
642
# ${PADDLE_SOURCE_DIR}/paddle/phi/kernels/fusion/gpu/fused_act_dequant_kernel.cu
601
643
# ${PADDLE_SOURCE_DIR}/paddle/phi/kernels/fusion/gpu/block_multi_head_attention_kernel.cu
602
644
# ${PADDLE_SOURCE_DIR}/paddle/phi/kernels/fusion/gpu/fused_weighted_swiglu_act_quant_kernel.cu
@@ -627,7 +669,6 @@ file(
627
669
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/kps/reduce_kernel.cu
628
670
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/legacy/kps/reduce_max_kernel.cu
629
671
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/array_kernel.cc
630
- ${CMAKE_SOURCE_DIR} /kernels/funcs/blas/cublas.cc
631
672
${CMAKE_SOURCE_DIR} /kernels/gpudnn/cudnn.cc
632
673
${CMAKE_SOURCE_DIR} /kernels/metax_context.cc
633
674
${CMAKE_SOURCE_DIR} /kernels/cross_entropy_kernel_register.cu
@@ -642,8 +683,6 @@ list(
642
683
REMOVE_ITEM
643
684
CUDA_SRCS
644
685
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/funcs/gru_compute.cu
645
- ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/funcs/matrix_solve.cu
646
- ${PADDLE_SOURCE_DIR} /paddle/phi/kernels/funcs/matrix_inverse.cu
647
686
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/funcs/multihead_matmul_functor.cu
648
687
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/funcs/softmax.cu
649
688
${PADDLE_SOURCE_DIR} /paddle/phi/kernels/funcs/weight_only_gemv.cu
@@ -672,6 +711,7 @@ file(
672
711
kernels/gpudnn/*.cu
673
712
kernels/cuda_kernels/*.cc
674
713
kernels/cuda_kernels/*.cu
714
+ kernels/funcs/blas/*.cc
675
715
kernels/ernie_core/*.cu
676
716
kernels/ernie_core/rms_norm_kernel_register.cu
677
717
kernels/ernie_core/top_p_sampling_kernel_register.cu
0 commit comments