File tree Expand file tree Collapse file tree 5 files changed +21
-7
lines changed
.ci/docker/ci_commit_pins
runtime/core/portable_type/c10/c10 Expand file tree Collapse file tree 5 files changed +21
-7
lines changed Original file line number Diff line number Diff line change 1- 59d5cf083b4f860dea76fe8936076177f9367f10
1+ 01f1cc44cbbfdf6307aa01b803a4ee22f9ade946
Original file line number Diff line number Diff line change @@ -35,7 +35,11 @@ set(XNNPACK_BUILD_TESTS
3535set (XNNPACK_ENABLE_AVXVNNI
3636 OFF
3737 CACHE BOOL ""
38- )
38+ )
39+ # Work around observed failure: https://github.com/pytorch/executorch/pull/10362#issuecomment-2906391232
40+ set (XNNPACK_ENABLE_AVX512VNNIGFNI
41+ OFF
42+ CACHE BOOL "" )
3943
4044if (EXECUTORCH_XNNPACK_ENABLE_KLEIDI)
4145 set (XNNPACK_ENABLE_KLEIDIAI
Original file line number Diff line number Diff line change @@ -71,7 +71,7 @@ def python_is_compatible():
7171#
7272# NOTE: If you're changing this, make the corresponding change in .ci/docker/ci_commit_pins/pytorch.txt
7373# by picking the hash from the same date in https://hud.pytorch.org/hud/pytorch/pytorch/nightly/
74- NIGHTLY_VERSION = "dev20250524 "
74+ NIGHTLY_VERSION = "dev20250422 "
7575
7676
7777def install_requirements (use_pytorch_nightly ):
Original file line number Diff line number Diff line change @@ -508,4 +508,14 @@ __host__ __device__
508508
509509#endif
510510
511+ // This macro identifies older C++ compilers
512+ // that don't support move optimization for return values.
513+
514+ #if (defined(__GNUC__) && __GNUC__ < 13) || \
515+ (defined (__clang_major__) && __clang_major__ < 13 )
516+ #define C10_RETURN_MOVE_IF_OLD_COMPILER 1
517+ #else
518+ #define C10_RETURN_MOVE_IF_OLD_COMPILER 0
519+ #endif
520+
511521#endif // C10_MACROS_MACROS_H_
Original file line number Diff line number Diff line change @@ -31,7 +31,7 @@ inline C10_HOST_DEVICE float f32_from_bits(uint16_t src) {
3131 uint32_t tmp = src;
3232 tmp <<= 16 ;
3333
34- #if defined(USE_ROCM)
34+ #if defined(USE_ROCM) && defined(__HIPCC__)
3535 float * tempRes;
3636
3737 // We should be using memcpy in order to respect the strict aliasing rule
@@ -48,7 +48,7 @@ inline C10_HOST_DEVICE float f32_from_bits(uint16_t src) {
4848inline C10_HOST_DEVICE uint16_t bits_from_f32 (float src) {
4949 uint32_t res = 0 ;
5050
51- #if defined(USE_ROCM)
51+ #if defined(USE_ROCM) && defined(__HIPCC__)
5252 // We should be using memcpy in order to respect the strict aliasing rule
5353 // but it fails in the HIP environment.
5454 uint32_t * tempRes = reinterpret_cast <uint32_t *>(&src);
@@ -61,7 +61,7 @@ inline C10_HOST_DEVICE uint16_t bits_from_f32(float src) {
6161}
6262
6363inline C10_HOST_DEVICE uint16_t round_to_nearest_even (float src) {
64- #if defined(USE_ROCM)
64+ #if defined(USE_ROCM) && defined(__HIPCC__)
6565 if (src != src) {
6666#elif defined(_MSC_VER)
6767 if (isnan (src)) {
@@ -87,7 +87,7 @@ struct alignas(2) BFloat16 {
8787 uint16_t x;
8888
8989 // HIP wants __host__ __device__ tag, CUDA does not
90- #if defined(USE_ROCM)
90+ #if defined(USE_ROCM) && defined(__HIPCC__)
9191 C10_HOST_DEVICE BFloat16 () = default ;
9292#else
9393 BFloat16 () = default ;
You can’t perform that action at this time.
0 commit comments