Fix issues with thrust benchmarks

miscco · miscco · commit 6597b5fbbbc7 · 2026-03-19T14:32:44.000+01:00
diff --git a/thrust/benchmarks/bench/find/basic.cu b/thrust/benchmarks/bench/find/basic.cu
@@ -1,12 +1,5 @@
-//===----------------------------------------------------------------------===//
-//
-// Part of libcu++, the C++ Standard Library for your entire system,
-// under the Apache License v2.0 with LLVM Exceptions.
-// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-FileCopyrightText: Copyright (c) 2026, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
-// SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES.
-//
-//===----------------------------------------------------------------------===//
 
 #include <thrust/device_vector.h>
 #include <thrust/find.h>
diff --git a/thrust/benchmarks/bench/find_if/basic.cu b/thrust/benchmarks/bench/find_if/basic.cu
@@ -1,15 +1,17 @@
-// SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+// SPDX-FileCopyrightText: Copyright (c) 2026, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 
-#include <thrust/detail/internal_functional.h>
 #include <thrust/device_vector.h>
-#include <thrust/fill.h>
 #include <thrust/find.h>
 
+#include <cuda/functional>
+#include <cuda/memory_pool>
+#include <cuda/stream>
+
 #include "nvbench_helper.cuh"
 
 template <typename T>
-void find_if(nvbench::state& state, nvbench::type_list<T>)
+static void basic(nvbench::state& state, nvbench::type_list<T>)
 {
   T val = 1;
   // set up input
@@ -24,13 +26,16 @@ void find_if(nvbench::state& state, nvbench::type_list<T>)
   state.add_global_memory_reads<T>(mismatch_point + 1);
   state.add_global_memory_writes<size_t>(1);
 
-  caching_allocator_t alloc;
-  state.exec(nvbench::exec_tag::no_batch | nvbench::exec_tag::sync, [&](nvbench::launch& launch) {
-    thrust::find_if(policy(alloc, launch), dinput.begin(), dinput.end(), cuda::equal_to_value<T>(val));
-  });
+  caching_allocator_t alloc{};
+
+  state.exec(nvbench::exec_tag::gpu | nvbench::exec_tag::no_batch | nvbench::exec_tag::sync,
+             [&](nvbench::launch& launch) {
+               do_not_optimize(
+                 thrust::find_if(policy(alloc, launch), dinput.begin(), dinput.end(), cuda::equal_to_value<T>{val}));
+             });
 }
 
-NVBENCH_BENCH_TYPES(find_if, NVBENCH_TYPE_AXES(fundamental_types))
+NVBENCH_BENCH_TYPES(basic, NVBENCH_TYPE_AXES(fundamental_types))
   .set_name("base")
   .add_int64_power_of_two_axis("Elements", nvbench::range(16, 28, 4))
-  .add_float64_axis("MismatchAt", std::vector{1.0, 0.5, 0.0});
+  .add_float64_axis("MismatchAt", std::vector{1.0, 0.5, 0.01});
diff --git a/thrust/benchmarks/bench/find_if_not/basic.cu b/thrust/benchmarks/bench/find_if_not/basic.cu
@@ -1,12 +1,5 @@
-//===----------------------------------------------------------------------===//
-//
-// Part of libcu++, the C++ Standard Library for your entire system,
-// under the Apache License v2.0 with LLVM Exceptions.
-// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-FileCopyrightText: Copyright (c) 2026, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
-// SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES.
-//
-//===----------------------------------------------------------------------===//
 
 #include <thrust/device_vector.h>
 #include <thrust/find.h>
diff --git a/thrust/benchmarks/bench/is_sorted/basic.cu b/thrust/benchmarks/bench/is_sorted/basic.cu
@@ -1,12 +1,5 @@
-//===----------------------------------------------------------------------===//
-//
-// Part of libcu++, the C++ Standard Library for your entire system,
-// under the Apache License v2.0 with LLVM Exceptions.
-// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-FileCopyrightText: Copyright (c) 2026, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
-// SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES.
-//
-//===----------------------------------------------------------------------===//
 
 #include <thrust/device_vector.h>
 #include <thrust/sequence.h>
diff --git a/thrust/benchmarks/bench/is_sorted_until/basic.cu b/thrust/benchmarks/bench/is_sorted_until/basic.cu
@@ -1,12 +1,5 @@
-//===----------------------------------------------------------------------===//
-//
-// Part of libcu++, the C++ Standard Library for your entire system,
-// under the Apache License v2.0 with LLVM Exceptions.
-// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-FileCopyrightText: Copyright (c) 2026, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
-// SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES.
-//
-//===----------------------------------------------------------------------===//
 
 #include <thrust/device_vector.h>
 #include <thrust/sequence.h>
diff --git a/thrust/benchmarks/bench/mismatch/basic.cu b/thrust/benchmarks/bench/mismatch/basic.cu
@@ -5,8 +5,8 @@
 #include <thrust/fill.h>
 #include <thrust/mismatch.h>
 
+#include <cuda/iterator>
 #include <cuda/memory_pool>
-#include <cuda/std/__pstl_algorithm>
 #include <cuda/stream>
 
 #include "nvbench_helper.cuh"
@@ -40,39 +40,3 @@ NVBENCH_BENCH_TYPES(range_iter, NVBENCH_TYPE_AXES(fundamental_types))
   .set_name("base_range_iter")
   .add_int64_power_of_two_axis("Elements", nvbench::range(16, 28, 4))
   .add_float64_axis("MismatchAt", std::vector{1.0, 0.5, 0.01});
-
-template <typename T>
-static void range_range(nvbench::state& state, nvbench::type_list<T>)
-{
-  T val = 1;
-  // set up input
-  const auto elements       = static_cast<std::size_t>(state.get_int64("Elements"));
-  const auto common_prefix  = state.get_float64("MismatchAt");
-  const auto mismatch_point = static_cast<std::size_t>(elements * common_prefix);
-
-  thrust::device_vector<T> dinput(elements, thrust::no_init);
-  thrust::fill(dinput.begin(), dinput.begin() + mismatch_point, T{0});
-  thrust::fill(dinput.begin() + mismatch_point, dinput.end(), val);
-
-  state.add_global_memory_reads<T>(mismatch_point + 1);
-  state.add_global_memory_writes<size_t>(1);
-
-  cuda::stream stream{cuda::device_ref{0}};
-  cuda::device_memory_pool_ref alloc = cuda::device_default_memory_pool(stream.device());
-
-  auto policy = cuda::execution::__cub_par_unseq.with_stream(stream).with_memory_resource(alloc);
-  state.exec(nvbench::exec_tag::gpu | nvbench::exec_tag::no_batch | nvbench::exec_tag::sync,
-             [&](nvbench::launch& launch) {
-               (void) cuda::std::mismatch(
-                 policy.with_stream(launch.get_stream().get_stream()),
-                 dinput.begin(),
-                 dinput.end(),
-                 cuda::constant_iterator<T>{0},
-                 cuda::constant_iterator<T>{0, elements});
-             });
-}
-
-NVBENCH_BENCH_TYPES(range_range, NVBENCH_TYPE_AXES(fundamental_types))
-  .set_name("base_range_range")
-  .add_int64_power_of_two_axis("Elements", nvbench::range(16, 28, 4))
-  .add_float64_axis("MismatchAt", std::vector{1.0, 0.5, 0.01});
diff --git a/thrust/benchmarks/bench/transform/zip_transform.cu b/thrust/benchmarks/bench/transform/zip_transform.cu
@@ -3,10 +3,9 @@
 
 #include <thrust/device_vector.h>
 #include <thrust/execution_policy.h>
-#include <thrust/iterator/zip_iterator.h>
-#include <thrust/zip_function.h>
 
-#include <cuda/__functional/address_stability.h>
+#include <cuda/functional>
+#include <cuda/iterator>
 
 #include <nvbench_helper.cuh>