Skip to content

Commit fde5d76

Browse files
authored
Merge branch 'main' into new-fix-vnni-types
2 parents e259ce4 + 349544d commit fde5d76

File tree

196 files changed

+110360
-7555
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

196 files changed

+110360
-7555
lines changed

.ci/all_requirements.txt

Lines changed: 3 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -194,9 +194,9 @@ ml-dtypes==0.5.1 ; python_version < "3.13" \
194194
--hash=sha256:d13755f8e8445b3870114e5b6240facaa7cb0c3361e54beba3e07fa912a6e12b \
195195
--hash=sha256:fd918d4e6a4e0c110e2e05be7a7814d10dc1b95872accbf6512b80a109b71ae1
196196
# via -r mlir/python/requirements.txt
197-
nanobind==2.9.2 \
198-
--hash=sha256:c37957ffd5eac7eda349cff3622ecd32e5ee1244ecc912c99b5bc8188bafd16e \
199-
--hash=sha256:e7608472de99d375759814cab3e2c94aba3f9ec80e62cfef8ced495ca5c27d6e
197+
nanobind==2.7.0 \
198+
--hash=sha256:73b12d0e751d140d6c1bf4b215e18818a8debfdb374f08dc3776ad208d808e74 \
199+
--hash=sha256:f9f1b160580c50dcf37b6495a0fd5ec61dc0d95dae5f8004f87dd9ad7eb46b34
200200
# via -r mlir/python/requirements.txt
201201
numpy==2.0.2 \
202202
--hash=sha256:0123ffdaa88fa4ab64835dcbde75dcdf89c453c922f18dced6e27c90d1d0ec5a \
@@ -383,10 +383,6 @@ swig==4.3.1 \
383383
--hash=sha256:efec16327029f682f649a26da726bb0305be8800bd0f1fa3e81bf0769cf5b476 \
384384
--hash=sha256:fc496c0d600cf1bb2d91e28d3d6eae9c4301e5ea7a0dec5a4281b5efed4245a8
385385
# via -r lldb/test/requirements.txt
386-
typing-extensions==4.15.0 \
387-
--hash=sha256:0cea48d173cc12fa28ecabc3b837ea3cf6f38c6d1136f85cbaaf598984861466 \
388-
--hash=sha256:f0fa19c6845758ab08074a0cfa8b7aecb71c999ca73d62883bc25cc018c4e548
389-
# via -r mlir/python/requirements.txt
390386
urllib3==2.5.0 \
391387
--hash=sha256:3fc47733c7e419d4bc3f6b3dc2b4f890bb743906a30d56ba4a5bfa4bbff92760 \
392388
--hash=sha256:e6b01673c0fa6a13e374b50871808eb3bf7046c4b125b216f6bf1cc604cff0dc

.github/new-prs-labeler.yml

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1090,6 +1090,14 @@ clang:openmp:
10901090
- llvm/unittests/Frontend/OpenMP*
10911091
- llvm/test/Transforms/OpenMP/**
10921092

1093+
clang:temporal-safety:
1094+
- clang/include/clang/Analysis/Analyses/LifetimeSafety*
1095+
- clang/lib/Analysis/LifetimeSafety*
1096+
- clang/unittests/Analysis/LifetimeSafety*
1097+
- clang/test/Sema/*lifetime-safety*
1098+
- clang/test/Sema/*lifetime-analysis*
1099+
- clang/test/Analysis/LifetimeSafety/**
1100+
10931101
clang:as-a-library:
10941102
- clang/tools/libclang/**
10951103
- clang/bindings/**

clang/lib/Analysis/LiveVariables.cpp

Lines changed: 8 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -72,15 +72,17 @@ bool LiveVariables::LivenessValues::isLive(const Expr *E) const {
7272

7373
bool LiveVariables::LivenessValues::isLive(const VarDecl *D) const {
7474
if (const auto *DD = dyn_cast<DecompositionDecl>(D)) {
75-
bool alive = false;
76-
for (const BindingDecl *BD : DD->bindings())
77-
alive |= liveBindings.contains(BD);
78-
7975
// Note: the only known case this condition is necessary, is when a binding
8076
// to a tuple-like structure is created. The HoldingVar initializers have a
8177
// DeclRefExpr to the DecompositionDecl.
82-
alive |= liveDecls.contains(DD);
83-
return alive;
78+
if (liveDecls.contains(DD))
79+
return true;
80+
81+
for (const BindingDecl *BD : DD->bindings()) {
82+
if (liveBindings.contains(BD))
83+
return true;
84+
}
85+
return false;
8486
}
8587
return liveDecls.contains(D);
8688
}

compiler-rt/test/fuzzer/sig-trap.test

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@ UNSUPPORTED: target={{.*windows.*}}
55
RUN: %cpp_compiler %S/SigTrapTest.cpp -o %t
66

77
RUN: not %run %t 2>&1 | FileCheck %s
8-
CHECK: BINGO
9-
CHECK: ERROR: libFuzzer: deadly signal
8+
CHECK-DAG: BINGO
9+
CHECK-DAG: ERROR: libFuzzer: deadly signal
1010

1111
RUN: trap "%run %t -handle_trap=0" TRAP

flang/lib/Utils/CMakeLists.txt

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -17,6 +17,8 @@ add_flang_library(FortranUtils
1717
LINK_LIBS
1818
FIRDialect
1919
FIRBuilder
20+
FortranEvaluate
21+
FortranSupport
2022
HLFIRDialect
2123

2224
MLIR_LIBS

libcxx/include/__memory/pointer_traits.h

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -255,7 +255,7 @@ concept __resettable_smart_pointer_with_args = requires(_Smart __s, _Pointer __p
255255
// This function ensures safe conversions between fancy pointers at compile-time, where we avoid casts from/to
256256
// `__void_pointer` by obtaining the underlying raw pointer from the fancy pointer using `std::to_address`,
257257
// then dereferencing it to retrieve the pointed-to object, and finally constructing the target fancy pointer
258-
// to that object using the `std::pointer_traits<>::pinter_to` function.
258+
// to that object using the `std::pointer_traits<>::pointer_to` function.
259259
template <class _PtrTo, class _PtrFrom>
260260
_LIBCPP_CONSTEXPR_SINCE_CXX20 _LIBCPP_HIDE_FROM_ABI _PtrTo __static_fancy_pointer_cast(const _PtrFrom& __p) {
261261
using __ptr_traits = pointer_traits<_PtrTo>;

libcxx/utils/cat_files.py

Lines changed: 0 additions & 51 deletions
This file was deleted.

llvm/docs/AMDGPUUsage.rst

Lines changed: 22 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -537,6 +537,8 @@ Every processor supports every OS ABI (see :ref:`amdgpu-os`) with the following
537537
- Packed
538538
work-item Add product
539539
IDs names.
540+
- Workgroup
541+
Clusters
540542

541543
=========== =============== ============ ===== ================= =============== =============== ======================
542544

@@ -768,9 +770,6 @@ For example:
768770
performant than code generated for XNACK replay
769771
disabled.
770772

771-
cu-stores TODO On GFX12.5, controls whether ``scope:SCOPE_CU`` stores may be used.
772-
If disabled, all stores will be done at ``scope:SCOPE_SE`` or greater.
773-
774773
=============== ============================ ==================================================
775774

776775
.. _amdgpu-target-id:
@@ -1098,6 +1097,22 @@ is conservatively correct for OpenCL.
10981097
- ``wavefront`` and executed by a thread in the
10991098
same wavefront.
11001099

1100+
``cluster`` Synchronizes with, and participates in modification
1101+
and seq_cst total orderings with, other operations
1102+
(except image operations) for all address spaces
1103+
(except private, or generic that accesses private)
1104+
provided the other operation's sync scope is:
1105+
1106+
- ``system``, ``agent`` or ``cluster`` and
1107+
executed by a thread on the same cluster.
1108+
- ``workgroup`` and executed by a thread in the
1109+
same work-group.
1110+
- ``wavefront`` and executed by a thread in the
1111+
same wavefront.
1112+
1113+
On targets that do not support workgroup cluster
1114+
launch mode, this behaves like ``agent`` scope instead.
1115+
11011116
``workgroup`` Synchronizes with, and participates in modification
11021117
and seq_cst total orderings with, other operations
11031118
(except image operations) for all address spaces
@@ -1131,6 +1146,9 @@ is conservatively correct for OpenCL.
11311146
``agent-one-as`` Same as ``agent`` but only synchronizes with other
11321147
operations within the same address space.
11331148

1149+
``cluster-one-as`` Same as ``cluster`` but only synchronizes with other
1150+
operations within the same address space.
1151+
11341152
``workgroup-one-as`` Same as ``workgroup`` but only synchronizes with
11351153
other operations within the same address space.
11361154

@@ -5114,9 +5132,7 @@ The fields used by CP for code objects before V3 also match those specified in
51145132
and must be 0,
51155133
>454 1 bit ENABLE_SGPR_PRIVATE_SEGMENT
51165134
_SIZE
5117-
455 1 bit USES_CU_STORES GFX12.5: Whether the ``cu-stores`` target attribute is enabled.
5118-
If 0, then all stores are ``SCOPE_SE`` or higher.
5119-
457:456 2 bits Reserved, must be 0.
5135+
457:455 3 bits Reserved, must be 0.
51205136
458 1 bit ENABLE_WAVEFRONT_SIZE32 GFX6-GFX9
51215137
Reserved, must be 0.
51225138
GFX10-GFX11
@@ -18254,8 +18270,6 @@ terminated by an ``.end_amdhsa_kernel`` directive.
1825418270
GFX942)
1825518271
``.amdhsa_user_sgpr_private_segment_size`` 0 GFX6-GFX12 Controls ENABLE_SGPR_PRIVATE_SEGMENT_SIZE in
1825618272
:ref:`amdgpu-amdhsa-kernel-descriptor-v3-table`.
18257-
``.amdhsa_uses_cu_stores`` 0 GFX12.5 Controls USES_CU_STORES in
18258-
:ref:`amdgpu-amdhsa-kernel-descriptor-v3-table`.
1825918273
``.amdhsa_wavefront_size32`` Target GFX10-GFX12 Controls ENABLE_WAVEFRONT_SIZE32 in
1826018274
Feature :ref:`amdgpu-amdhsa-kernel-descriptor-v3-table`.
1826118275
Specific

llvm/docs/QualGroup.rst

Lines changed: 23 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,8 @@
1+
.. CHANGE TRACKER for reference
2+
.. Purpose: Fixed document location and added Current Topics & Backlog
3+
.. Author: Carlos Andres Ramirez
4+
.. Last updated: 2025-09-08 by Carlos Ramirez
5+
16
========================
27
LLVM Qualification Group
38
========================
@@ -48,6 +53,20 @@ Participation is open to anyone interested. There are several ways to get involv
4853

4954
We welcome contributors from diverse backgrounds, organizations, and experience levels.
5055

56+
Current Topics & Backlog
57+
========================
58+
59+
Our working group is actively engaged in discussions about the project's
60+
direction and tackling technical challenges. You can find our current
61+
discussions, challenges, and the project backlog in the following
62+
document.
63+
64+
`Backlog document <https://docs.google.com/document/d/10YZZ72ba09Ck_OiJaP9C4-7DeUiveaIKTE3IkaSKjzA/edit?usp=sharing>`_
65+
66+
This document serves as our central hub for all ongoing topics and will
67+
be updated regularly to reflect our progress. We welcome your
68+
contributions and feedback.
69+
5170
Meeting Materials
5271
=================
5372

@@ -60,9 +79,10 @@ on the LLVM Discourse forum: `Meeting Agendas and Minutes <https://discourse.llv
6079
Slides used to support discussions during sync-up meetings are stored in LLVM's GitHub repository.
6180

6281
Available slides:
63-
* `September 2025 <../qual-wg/slides/202509_llvm_qual_wg.pdf>`_
64-
* `August 2025 <../qual-wg/slides/202508_llvm_qual_wg.pdf>`_
65-
* `July 2025 <../qual-wg/slides/202507_llvm_qual_wg.pdf>`_
82+
83+
* `September 2025 <qual-wg/slides/202509_llvm_qual_wg.pdf>`_
84+
* `August 2025 <qual-wg/slides/202508_llvm_qual_wg.pdf>`_
85+
* `July 2025 <qual-wg/slides/202507_llvm_qual_wg.pdf>`_
6686
* (add future entries here)
6787

6888
A future patch will migrate these slide files to the `llvm-www` repository, once

llvm/include/llvm/Support/AMDHSAKernelDescriptor.h

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -252,8 +252,7 @@ enum : int32_t {
252252
KERNEL_CODE_PROPERTY(ENABLE_SGPR_DISPATCH_ID, 4, 1),
253253
KERNEL_CODE_PROPERTY(ENABLE_SGPR_FLAT_SCRATCH_INIT, 5, 1),
254254
KERNEL_CODE_PROPERTY(ENABLE_SGPR_PRIVATE_SEGMENT_SIZE, 6, 1),
255-
KERNEL_CODE_PROPERTY(RESERVED0, 7, 2),
256-
KERNEL_CODE_PROPERTY(USES_CU_STORES, 9, 1), // GFX12.5 +cu-stores
255+
KERNEL_CODE_PROPERTY(RESERVED0, 7, 3),
257256
KERNEL_CODE_PROPERTY(ENABLE_WAVEFRONT_SIZE32, 10, 1), // GFX10+
258257
KERNEL_CODE_PROPERTY(USES_DYNAMIC_STACK, 11, 1),
259258
KERNEL_CODE_PROPERTY(RESERVED1, 12, 4),

0 commit comments

Comments
 (0)