Skip to content

Commit 7bb5f5c

Browse files
author
iclsrc
committed
Merge from 'sycl' to 'sycl-web' (18 commits)
2 parents 8c017d6 + 9457ac2 commit 7bb5f5c

File tree

56 files changed

+2447
-1704
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

56 files changed

+2447
-1704
lines changed

.github/workflows/libcxx-check-generated-files.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ jobs:
1515
uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
1616

1717
- name: Install dependencies
18-
uses: aminya/setup-cpp@9dc9c217f497fe7342eed97e6f200bf101c9cc04 # v1.6.2
18+
uses: aminya/setup-cpp@004edc19527a83d56cda032658aab55c5e2ed48f # v1.7.0
1919
with:
2020
clangformat: 17.0.1
2121
ninja: true

.github/workflows/pr-code-format.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -55,7 +55,7 @@ jobs:
5555
echo "$CHANGED_FILES"
5656
5757
- name: Install clang-format
58-
uses: aminya/setup-cpp@9dc9c217f497fe7342eed97e6f200bf101c9cc04 # v1.6.2
58+
uses: aminya/setup-cpp@004edc19527a83d56cda032658aab55c5e2ed48f # v1.7.0
5959
with:
6060
clangformat: 20.1.5
6161

.github/workflows/release-lit.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -45,7 +45,7 @@ jobs:
4545
./llvm/utils/release/./github-upload-release.py --token "$GITHUB_TOKEN" --user ${{ github.actor }} --user-token "$USER_TOKEN" check-permissions
4646
4747
- name: Setup Cpp
48-
uses: aminya/setup-cpp@9dc9c217f497fe7342eed97e6f200bf101c9cc04 # v1.6.2
48+
uses: aminya/setup-cpp@004edc19527a83d56cda032658aab55c5e2ed48f # v1.7.0
4949
with:
5050
compiler: llvm-16.0.6
5151
cmake: true

clang/include/clang/Driver/Driver.h

Lines changed: 0 additions & 34 deletions
Original file line numberDiff line numberDiff line change
@@ -775,25 +775,6 @@ class Driver {
775775
/// Get the specific kind of offload LTO being performed.
776776
LTOKind getOffloadLTOMode() const { return OffloadLTOMode; }
777777

778-
// FPGA Offload Modes.
779-
enum DeviceMode {
780-
UnsetDeviceMode,
781-
FPGAHWMode,
782-
FPGAEmulationMode
783-
} OffloadCompileMode = UnsetDeviceMode;
784-
785-
bool IsFPGAHWMode() const { return OffloadCompileMode == FPGAHWMode; }
786-
787-
bool IsFPGAEmulationMode() const {
788-
return OffloadCompileMode == FPGAEmulationMode;
789-
}
790-
791-
void setOffloadCompileMode(DeviceMode ModeValue) {
792-
OffloadCompileMode = ModeValue;
793-
}
794-
795-
DeviceMode getOffloadCompileMode() { return OffloadCompileMode; }
796-
797778
/// Get the CUID option.
798779
const CUIDOptions &getCUIDOpts() const { return CUIDOpts; }
799780

@@ -893,9 +874,6 @@ class Driver {
893874
void checkForOffloadMismatch(Compilation &C,
894875
llvm::opt::DerivedArgList &Args) const;
895876

896-
/// Track filename used for the FPGA dependency info.
897-
mutable llvm::StringMap<const std::string> FPGATempDepFiles;
898-
899877
/// A list of inputs and their corresponding integration headers. These
900878
/// files are generated during the device compilation and are consumed
901879
/// by the host compilation.
@@ -948,18 +926,6 @@ class Driver {
948926
/// getUseNewOffloadingDriver - use the new offload driver for OpenMP.
949927
bool getUseNewOffloadingDriver() const { return UseNewOffloadingDriver; };
950928

951-
/// addFPGATempDepFile - Add a file to be added to the bundling step of
952-
/// an FPGA object.
953-
void addFPGATempDepFile(const std::string &DepName,
954-
const std::string &FileName) const {
955-
FPGATempDepFiles.insert({FileName, DepName});
956-
}
957-
/// getFPGATempDepFile - Get a file to be added to the bundling step of
958-
/// an FPGA object.
959-
const std::string getFPGATempDepFile(const std::string &FileName) const {
960-
return FPGATempDepFiles[FileName];
961-
}
962-
963929
/// isSYCLDefaultTripleImplied - The default SYCL triple (spir64) has been
964930
/// added or should be added given proper criteria.
965931
bool isSYCLDefaultTripleImplied() const { return SYCLDefaultTripleImplied; };

devops/scripts/benchmarks/benches/compute.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -466,6 +466,7 @@ def bin_args(self) -> list[str]:
466466
f"--src={self.destination}",
467467
f"--dst={self.destination}",
468468
f"--size={self.size}",
469+
"--withCopyOffload=0",
469470
]
470471

471472

@@ -501,6 +502,7 @@ def bin_args(self) -> list[str]:
501502
f"--destinationPlacement={self.destination}",
502503
f"--size={self.size}",
503504
"--count=100",
505+
"--withCopyOffload=0",
504506
]
505507

506508

devops/scripts/benchmarks/options.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -65,7 +65,7 @@ class Options:
6565
build_compute_runtime: bool = False
6666
extra_ld_libraries: list[str] = field(default_factory=list)
6767
extra_env_vars: dict = field(default_factory=dict)
68-
compute_runtime_tag: str = "25.13.33276.18"
68+
compute_runtime_tag: str = "25.22.33944.4"
6969
build_igc: bool = False
7070
current_run_name: str = "This PR"
7171
preset: str = "Full"

devops/scripts/install_drivers.sh

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,7 @@
22

33
set -e
44
set -x
5+
set -o pipefail
56

67
if [ -f "$1" ]; then
78
# Read data from the dependencies.json passed as the first argument.

lldb/tools/lldb-dap/package-lock.json

Lines changed: 3 additions & 3 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

llvm/docs/requirements-hashed.txt

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -298,9 +298,9 @@ recommonmark==0.7.1 \
298298
--hash=sha256:1b1db69af0231efce3fa21b94ff627ea33dee7079a01dd0a7f8482c3da148b3f \
299299
--hash=sha256:bdb4db649f2222dcd8d2d844f0006b958d627f732415d399791ee436a3686d67
300300
# via -r requirements.txt
301-
requests==2.32.3 \
302-
--hash=sha256:55365417734eb18255590a9ff9eb97e9e1da868d4ccd6402399eaf68af20a760 \
303-
--hash=sha256:70761cfe03c773ceb22aa2f671b4757976145175cdfca038c02654d061d6dcc6
301+
requests==2.32.4 \
302+
--hash=sha256:27babd3cda2a6d50b30443204ee89830707d396671944c998b5975b031ac2b2c \
303+
--hash=sha256:27d0316682c8a29834d3264820024b62a36942083d52caf2f14c0591336d3422
304304
# via sphinx
305305
snowballstemmer==3.0.1 \
306306
--hash=sha256:6cd7b3897da8d6c9ffb968a6781fa6532dce9c3618a4b127d920dab764a19064 \

llvm/include/llvm/SYCLLowerIR/DeviceConfigFile.td

Lines changed: 45 additions & 34 deletions
Original file line numberDiff line numberDiff line change
@@ -321,38 +321,49 @@ defvar HipSubgroupSizesGCN5 = [64]; // gfx900-gfx906 GCN5.0 (known as "Vega"
321321
defvar HipSubgroupSizesRDNA = [32]; // gfxX10-gfx11 (encapsulates RDNA1..3), (wave64 mode available but not used).
322322
defvar HipSubgroupSizesCDNA = [64]; // gfx908, gfx90a (encapsulates CDNA1..2)
323323

324-
defvar HipMinAspects = [AspectGpu, AspectFp64, AspectOnline_compiler, AspectOnline_linker, AspectQueue_profiling,
325-
AspectExt_intel_pci_address, AspectExt_intel_max_mem_bandwidth, AspectExt_intel_device_id,
326-
AspectExt_intel_memory_clock_rate, AspectExt_intel_memory_bus_width, AspectExt_intel_free_memory];
324+
defvar HipMinAspects = [AspectGpu, AspectFp16, AspectFp64,
325+
AspectOnline_compiler, AspectOnline_linker, AspectQueue_profiling,
326+
AspectExt_intel_pci_address, AspectExt_intel_max_mem_bandwidth,
327+
AspectExt_intel_device_id, AspectExt_intel_memory_clock_rate,
328+
AspectExt_intel_memory_bus_width, AspectExt_intel_free_memory];
327329

330+
defvar HipUSMAspects = !listremove(AllUSMAspects, [AspectUsm_system_allocations]);
331+
defvar HipGraphAspects = [AspectExt_oneapi_graph, AspectExt_oneapi_limited_graph];
328332
// The following AMDGCN targets are ordered based on their ROCm driver support:
329333
//
330334
// Officially supported:
331-
def : HipTargetInfo<"amd_gpu_gfx908", !listconcat(HipMinAspects, AllUSMAspects,
332-
[AspectExt_intel_device_info_uuid, AspectExt_oneapi_graph, AspectExt_oneapi_limited_graph]), HipSubgroupSizesCDNA>;
333-
def : HipTargetInfo<"amd_gpu_gfx90a", !listconcat(HipMinAspects, AllUSMAspects,
334-
[AspectExt_intel_device_info_uuid, AspectExt_oneapi_graph, AspectExt_oneapi_limited_graph, AspectExt_oneapi_native_assert]),
335+
def : HipTargetInfo<"amd_gpu_gfx908", !listconcat(
336+
HipMinAspects, HipUSMAspects, HipGraphAspects,
337+
[AspectExt_intel_device_info_uuid]), HipSubgroupSizesCDNA>;
338+
def : HipTargetInfo<"amd_gpu_gfx90a", !listconcat(
339+
HipMinAspects, HipUSMAspects, HipGraphAspects,
340+
[AspectAtomic64, AspectExt_intel_device_info_uuid, AspectExt_oneapi_native_assert]),
335341
HipSubgroupSizesCDNA>;
336342
// TODO: Need to verify whether device-side asserts (oneapi_native_assert) are
337343
// now working for the new CDNA3 gfx940, gfx941, gfx942 GPUs and fixed for the
338344
// other supported, gfx1030 and gfx1100, RDNA3 GPUs.
339-
def : HipTargetInfo<"amd_gpu_gfx940", !listconcat(HipMinAspects, AllUSMAspects,
340-
[AspectExt_intel_device_info_uuid, AspectExt_oneapi_graph, AspectExt_oneapi_limited_graph]),
345+
def : HipTargetInfo<"amd_gpu_gfx940", !listconcat(
346+
HipMinAspects, HipUSMAspects, HipGraphAspects,
347+
[AspectExt_intel_device_info_uuid]),
341348
HipSubgroupSizesCDNA>;
342-
def : HipTargetInfo<"amd_gpu_gfx941", !listconcat(HipMinAspects, AllUSMAspects,
343-
[AspectExt_intel_device_info_uuid, AspectExt_oneapi_graph, AspectExt_oneapi_limited_graph]),
349+
def : HipTargetInfo<"amd_gpu_gfx941", !listconcat(
350+
HipMinAspects, HipUSMAspects, HipGraphAspects,
351+
[AspectExt_intel_device_info_uuid]),
344352
HipSubgroupSizesCDNA>;
345-
def : HipTargetInfo<"amd_gpu_gfx942", !listconcat(HipMinAspects, AllUSMAspects,
346-
[AspectExt_intel_device_info_uuid, AspectExt_oneapi_graph, AspectExt_oneapi_limited_graph]),
353+
def : HipTargetInfo<"amd_gpu_gfx942", !listconcat(
354+
HipMinAspects, HipUSMAspects, HipGraphAspects,
355+
[AspectExt_intel_device_info_uuid]),
347356
HipSubgroupSizesCDNA>;
348-
def : HipTargetInfo<"amd_gpu_gfx1030", !listconcat(HipMinAspects, AllUSMAspects,
349-
[AspectExt_intel_device_info_uuid, AspectExt_oneapi_graph, AspectExt_oneapi_limited_graph]),
357+
def : HipTargetInfo<"amd_gpu_gfx1030", !listconcat(
358+
HipMinAspects, HipUSMAspects, HipGraphAspects,
359+
[AspectAtomic64, AspectExt_intel_device_info_uuid]),
350360
HipSubgroupSizesRDNA>;
351-
def : HipTargetInfo<"amd_gpu_gfx1100", !listconcat(HipMinAspects, AllUSMAspects,
352-
[AspectExt_intel_device_info_uuid, AspectExt_oneapi_graph, AspectExt_oneapi_limited_graph]),
361+
def : HipTargetInfo<"amd_gpu_gfx1100", !listconcat(
362+
HipMinAspects, HipUSMAspects, HipGraphAspects,
363+
[AspectExt_intel_device_info_uuid]),
353364
HipSubgroupSizesRDNA>;
354365
// Deprecated support:
355-
def : HipTargetInfo<"amd_gpu_gfx906", !listconcat(HipMinAspects, AllUSMAspects), HipSubgroupSizesGCN5>;
366+
def : HipTargetInfo<"amd_gpu_gfx906", !listconcat(HipMinAspects, HipUSMAspects), HipSubgroupSizesGCN5>;
356367
// Unsupported (or unofficially supported):
357368
def : HipTargetInfo<"amd_gpu_gfx700", HipMinAspects, HipSubgroupSizesGCN2>;
358369
def : HipTargetInfo<"amd_gpu_gfx701", HipMinAspects, HipSubgroupSizesGCN2>;
@@ -369,23 +380,23 @@ def : HipTargetInfo<"amd_gpu_gfx900", HipMinAspects, HipSubgroupSizesGCN5>;
369380
def : HipTargetInfo<"amd_gpu_gfx902", HipMinAspects, HipSubgroupSizesGCN5>;
370381
def : HipTargetInfo<"amd_gpu_gfx904", HipMinAspects, HipSubgroupSizesGCN5>;
371382
def : HipTargetInfo<"amd_gpu_gfx909", HipMinAspects, HipSubgroupSizesGCN5>;
372-
def : HipTargetInfo<"amd_gpu_gfx90c", !listconcat(HipMinAspects, AllUSMAspects), HipSubgroupSizesGCN5>;
373-
def : HipTargetInfo<"amd_gpu_gfx1010", !listconcat(HipMinAspects, AllUSMAspects), HipSubgroupSizesRDNA>;
374-
def : HipTargetInfo<"amd_gpu_gfx1011", !listconcat(HipMinAspects, AllUSMAspects), HipSubgroupSizesRDNA>;
375-
def : HipTargetInfo<"amd_gpu_gfx1012", !listconcat(HipMinAspects, AllUSMAspects), HipSubgroupSizesRDNA>;
376-
def : HipTargetInfo<"amd_gpu_gfx1013", !listconcat(HipMinAspects, AllUSMAspects), HipSubgroupSizesRDNA>;
377-
def : HipTargetInfo<"amd_gpu_gfx1031", !listconcat(!listremove(HipMinAspects, [AspectExt_intel_free_memory]), AllUSMAspects),
383+
def : HipTargetInfo<"amd_gpu_gfx90c", !listconcat(HipMinAspects, HipUSMAspects), HipSubgroupSizesGCN5>;
384+
def : HipTargetInfo<"amd_gpu_gfx1010", !listconcat(HipMinAspects, HipUSMAspects), HipSubgroupSizesRDNA>;
385+
def : HipTargetInfo<"amd_gpu_gfx1011", !listconcat(HipMinAspects, HipUSMAspects), HipSubgroupSizesRDNA>;
386+
def : HipTargetInfo<"amd_gpu_gfx1012", !listconcat(HipMinAspects, HipUSMAspects), HipSubgroupSizesRDNA>;
387+
def : HipTargetInfo<"amd_gpu_gfx1013", !listconcat(HipMinAspects, HipUSMAspects), HipSubgroupSizesRDNA>;
388+
def : HipTargetInfo<"amd_gpu_gfx1031", !listconcat(!listremove(HipMinAspects, [AspectExt_intel_free_memory]), HipUSMAspects),
378389
HipSubgroupSizesRDNA>;
379-
def : HipTargetInfo<"amd_gpu_gfx1032", !listconcat(HipMinAspects, AllUSMAspects), HipSubgroupSizesRDNA>;
380-
def : HipTargetInfo<"amd_gpu_gfx1033", !listconcat(HipMinAspects, AllUSMAspects), HipSubgroupSizesRDNA>;
381-
def : HipTargetInfo<"amd_gpu_gfx1034", !listconcat(HipMinAspects, AllUSMAspects), HipSubgroupSizesRDNA>;
382-
def : HipTargetInfo<"amd_gpu_gfx1035", !listconcat(HipMinAspects, AllUSMAspects), HipSubgroupSizesRDNA>;
383-
def : HipTargetInfo<"amd_gpu_gfx1036", !listconcat(HipMinAspects, AllUSMAspects), HipSubgroupSizesRDNA>;
384-
def : HipTargetInfo<"amd_gpu_gfx1101", !listconcat(HipMinAspects, AllUSMAspects), HipSubgroupSizesRDNA>;
385-
def : HipTargetInfo<"amd_gpu_gfx1102", !listconcat(HipMinAspects, AllUSMAspects), HipSubgroupSizesRDNA>;
386-
def : HipTargetInfo<"amd_gpu_gfx1103", !listconcat(HipMinAspects, AllUSMAspects), HipSubgroupSizesRDNA>;
387-
def : HipTargetInfo<"amd_gpu_gfx1150", !listconcat(HipMinAspects, AllUSMAspects), HipSubgroupSizesRDNA>;
388-
def : HipTargetInfo<"amd_gpu_gfx1151", !listconcat(HipMinAspects, AllUSMAspects), HipSubgroupSizesRDNA>;
390+
def : HipTargetInfo<"amd_gpu_gfx1032", !listconcat(HipMinAspects, HipUSMAspects), HipSubgroupSizesRDNA>;
391+
def : HipTargetInfo<"amd_gpu_gfx1033", !listconcat(HipMinAspects, HipUSMAspects), HipSubgroupSizesRDNA>;
392+
def : HipTargetInfo<"amd_gpu_gfx1034", !listconcat(HipMinAspects, HipUSMAspects), HipSubgroupSizesRDNA>;
393+
def : HipTargetInfo<"amd_gpu_gfx1035", !listconcat(HipMinAspects, HipUSMAspects), HipSubgroupSizesRDNA>;
394+
def : HipTargetInfo<"amd_gpu_gfx1036", !listconcat(HipMinAspects, HipUSMAspects), HipSubgroupSizesRDNA>;
395+
def : HipTargetInfo<"amd_gpu_gfx1101", !listconcat(HipMinAspects, HipUSMAspects), HipSubgroupSizesRDNA>;
396+
def : HipTargetInfo<"amd_gpu_gfx1102", !listconcat(HipMinAspects, HipUSMAspects), HipSubgroupSizesRDNA>;
397+
def : HipTargetInfo<"amd_gpu_gfx1103", !listconcat(HipMinAspects, HipUSMAspects), HipSubgroupSizesRDNA>;
398+
def : HipTargetInfo<"amd_gpu_gfx1150", !listconcat(HipMinAspects, HipUSMAspects), HipSubgroupSizesRDNA>;
399+
def : HipTargetInfo<"amd_gpu_gfx1151", !listconcat(HipMinAspects, HipUSMAspects), HipSubgroupSizesRDNA>;
389400
// TBA
390401
def : HipTargetInfo<"amd_gpu_gfx1200", [], []>; // RDNA 4
391402
def : HipTargetInfo<"amd_gpu_gfx1201", [], []>; // RDNA 4

0 commit comments

Comments
 (0)