1 file changed
+1
-1
lines changed- README.md+1-1
- README_cn.md+1-1
- README_ja.md+1-1
- cmake/external/xpu.cmake+1-1
- paddle/ap/include/axpr/builtin_functions.h-3
- paddle/ap/include/axpr/global_environment.h+1-1
- paddle/cinn/ir/intrinsic_ops.h+1-1
- paddle/fluid/eager/auto_code_generator/generator/eager_gen.py+2
- paddle/phi/api/lib/api_gen_utils.cc+1-1
- paddle/phi/api/lib/kernel_dispatch.h+6-6
- paddle/phi/backends/dynload/nvtx.h+4-1
- paddle/phi/kernels/funcs/activation_functor.h+52-1
- paddle/phi/kernels/funcs/correlation_funcs.cu.h+28-23
- paddle/phi/kernels/funcs/fused_gemm_epilogue_xpu.h+2-6
- paddle/phi/kernels/funcs/multihead_matmul_functor.cu+3-6
- paddle/phi/kernels/fusion/gpu/multihead_matmul_kernel.cu+1-1
- paddle/phi/kernels/fusion/gpu/skip_layernorm_kernel.cu+1-1
- paddle/phi/kernels/fusion/xpu/fused_feedforward_grad_kernel.cc-1
- paddle/phi/kernels/gpu/correlation_grad_kernel.cu+124-131
- paddle/phi/kernels/gpu/correlation_kernel.cu+81-57
- paddle/phi/kernels/stride/matmul_stride_kernel.cu+243
- paddle/phi/kernels/xpu/activation_grad_kernel.cc+9-1
- paddle/utils/any.h+9-6
- python/paddle/__init__.py+1
- python/paddle/base/executor.py+1-1
- python/paddle/cuda/__init__.py+327-47
- python/paddle/device/__init__.py+215-11
- python/paddle/device/cpu_device.py+109
- python/paddle/device/cuda/__init__.py+57
- python/paddle/device/custom_device.py+59
- python/paddle/device/xpu/__init__.py+56
- python/paddle/distributed/auto_parallel/api.py+1-1
- python/paddle/distributed/fleet/meta_optimizers/dygraph_optimizer/dygraph_sharding_optimizer.py+1
- python/paddle/distributed/fleet/meta_parallel/__init__.py+1
- python/paddle/distributed/fleet/meta_parallel/pipeline_parallel.py+16
- python/paddle/framework/dtype.py+3-3
- python/paddle/framework/random.py+1-1
- python/paddle/optimizer/adamw.py+1
- python/paddle/sparse/creation.py+2-2
- python/paddle/tensor/creation.py+15-23
- python/paddle/tensor/manipulation.py+3-6
- python/paddle/tensor/random.py+2-2
- test/collective/fleet/hybrid_parallel_pp_transformer.py+34-3
- test/compat/test_device_apis.py+3
- test/compat/test_get_device_module.py+79
- test/compat/test_paddle_cuda_apis.py+468
- test/compat/test_rng_state.py+76
- test/contrib/test_correlation.py+83
- test/cpp/fluid/CMakeLists.txt+1-1
- test/cpp/fluid/onednn/CMakeLists.txt
- test/cpp/fluid/onednn/test_conv_onednn_nhwc.cc
- test/cpp/fluid/onednn/test_onednn_caching.cc
- test/cpp/fluid/onednn/test_onednn_conv2d_transpose_bias.cc
- test/cpp/fluid/onednn/test_onednn_cpu_quantize_pass.cc
- test/cpp/fluid/onednn/test_onednn_op_inplace.cc
- test/cpp/fluid/onednn/test_onednn_op_nhwc.cc
- test/cpp/fluid/onednn/test_onednn_pool_adaptive_op.cc
- test/cpp/fluid/onednn/test_onednn_squeeze.cc
- test/deprecated/cpp/inference/api/analyzer_detect_functional_onednn_tester_deprecated.cc
- test/flex_checkpoint/CMakeLists.txt+4
- test/flex_checkpoint/sharded_state_dict_logic.py+192-14
- test/flex_checkpoint/test_sharded_state_dict.py+62-2
- test/ir/inference/CMakeLists.txt+15-15
- test/ir/inference/test_onednn_conv3d_bias_fuse_pass.py+2-2
- test/ir/inference/test_onednn_conv3d_op.py
- test/ir/inference/test_onednn_conv_affine_channel_fuse_pass.py
- test/ir/inference/test_onednn_conv_gelu_fuse_pass.py
- test/ir/inference/test_onednn_conv_mish_fuse_pass.py
- test/ir/inference/test_onednn_conv_transpose_bias_fuse_pass.py
- test/ir/inference/test_onednn_mish_op.py+1-1
- test/ir/inference/test_onednn_prelu_op.py+1-1
- test/ir/inference/test_onednn_shape_op.py+1-1
- test/ir/inference/test_onednn_shuffle_channel_op.py+1-1
- test/legacy_test/test_adadelta_op.py+3-5
- test/legacy_test/test_adam_optimizer_fp32_fp64.py+3-5
- test/legacy_test/test_cuda_unittest.py+29-19
- test/legacy_test/test_dropout_op.py+4-13
- test/legacy_test/test_logical_op.py+1-8
- test/legacy_test/test_memcpy_op.py+17-9
- test/legacy_test/test_momentum_op.py+8-12
- test/legacy_test/test_network_with_dtype.py+4-5
- test/legacy_test/test_rmsprop_op.py+3-5
- test/mkldnn/test_elementwise_add_bf16_onednn_op.py+3-3
- test/mkldnn/test_expand_v2_onednn_op.py+1-1
- test/mkldnn/test_fc_bf16_onednn_op.py+2-2
- test/mkldnn/test_matmul_bf16_onednn_op.py
- test/mkldnn/test_matmul_v2_onednn_op.py+1
- test/mkldnn/test_nearest_interp_v2_onednn_op.py
- tools/parallel_UT_rule.py+5-5
- tools/static_mode_white_list.py+4-4
- tools/windows/run_unittests.sh+4-4
0 commit comments