NVIDIA
diff --git a/‎.devcontainer/cuda11.8-gcc11/devcontainer.json‎
Lines changed: 1 addition & 1 deletion b/‎.devcontainer/cuda11.8-gcc11/devcontainer.json‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎…ntainer/cuda12.6-gcc12/devcontainer.json‎ ‎…ntainer/cuda12.8-gcc12/devcontainer.json‎.devcontainer/cuda12.6-gcc12/devcontainer.json renamed to .devcontainer/cuda12.8-gcc12/devcontainer.json
Lines changed: 4 additions & 4 deletions b/‎…ntainer/cuda12.6-gcc12/devcontainer.json‎ ‎…ntainer/cuda12.8-gcc12/devcontainer.json‎.devcontainer/cuda12.6-gcc12/devcontainer.json renamed to .devcontainer/cuda12.8-gcc12/devcontainer.json
Lines changed: 4 additions & 4 deletions
diff --git a/‎…ntainer/cuda12.6-gcc13/devcontainer.json‎ ‎…ntainer/cuda12.8-gcc13/devcontainer.json‎.devcontainer/cuda12.6-gcc13/devcontainer.json renamed to .devcontainer/cuda12.8-gcc13/devcontainer.json
Lines changed: 4 additions & 4 deletions b/‎…ntainer/cuda12.6-gcc13/devcontainer.json‎ ‎…ntainer/cuda12.8-gcc13/devcontainer.json‎.devcontainer/cuda12.6-gcc13/devcontainer.json renamed to .devcontainer/cuda12.8-gcc13/devcontainer.json
Lines changed: 4 additions & 4 deletions
diff --git a/‎.devcontainer/devcontainer.json‎
Lines changed: 4 additions & 4 deletions b/‎.devcontainer/devcontainer.json‎
Lines changed: 4 additions & 4 deletions
diff --git a/‎.pre-commit-config.yaml‎
Lines changed: 1 addition & 1 deletion b/‎.pre-commit-config.yaml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎CMakeLists.txt‎
Lines changed: 9 additions & 3 deletions b/‎CMakeLists.txt‎
Lines changed: 9 additions & 3 deletions
diff --git a/‎README.md‎
Lines changed: 1 addition & 1 deletion b/‎README.md‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎benchmarks/CMakeLists.txt‎
Lines changed: 3 additions & 10 deletions b/‎benchmarks/CMakeLists.txt‎
Lines changed: 3 additions & 10 deletions
diff --git a/‎benchmarks/dynamic_map/retrieve_all_bench.cu‎
Lines changed: 92 additions & 0 deletions b/‎benchmarks/dynamic_map/retrieve_all_bench.cu‎
Lines changed: 92 additions & 0 deletions
diff --git a/‎ci/build.sh‎
Lines changed: 4 additions & 4 deletions b/‎ci/build.sh‎
Lines changed: 4 additions & 4 deletions
@@ -1,6 +1,6 @@
 {
   "shutdownAction": "stopContainer",
-  "image": "rapidsai/devcontainers:24.12-cpp-gcc11-cuda11.8-ubuntu22.04",
+  "image": "rapidsai/devcontainers:25.06-cpp-gcc11-cuda11.8-ubuntu22.04",
   "hostRequirements": {
     "gpu": true
   },
 
@@ -1,6 +1,6 @@
 {
   "shutdownAction": "stopContainer",
-  "image": "rapidsai/devcontainers:24.12-cpp-gcc12-cuda12.6-ubuntu22.04",
+  "image": "rapidsai/devcontainers:25.06-cpp-gcc12-cuda12.8-ubuntu22.04",
   "hostRequirements": {
     "gpu": true
   },
@@ -14,8 +14,8 @@
     "SCCACHE_BUCKET": "rapids-sccache-devs",
     "AWS_ROLE_ARN": "arn:aws:iam::279114543810:role/nv-gha-token-sccache-devs",
     "HISTFILE": "${containerWorkspaceFolder}/.cache/._bash_history",
-    "DEVCONTAINER_NAME": "cuda12.6-gcc12",
-    "CUCO_CUDA_VERSION": "12.6",
+    "DEVCONTAINER_NAME": "cuda12.8-gcc12",
+    "CUCO_CUDA_VERSION": "12.8",
     "CUCO_HOST_COMPILER": "gcc",
     "CUCO_HOST_COMPILER_VERSION": "12"
   },
@@ -38,5 +38,5 @@
       }
     }
   },
-  "name": "cuda12.6-gcc12"
+  "name": "cuda12.8-gcc12"
 }
@@ -1,6 +1,6 @@
 {
   "shutdownAction": "stopContainer",
-  "image": "rapidsai/devcontainers:24.12-cpp-gcc13-cuda12.6-ubuntu22.04",
+  "image": "rapidsai/devcontainers:25.06-cpp-gcc13-cuda12.8-ubuntu22.04",
   "hostRequirements": {
     "gpu": true
   },
@@ -14,8 +14,8 @@
     "SCCACHE_BUCKET": "rapids-sccache-devs",
     "AWS_ROLE_ARN": "arn:aws:iam::279114543810:role/nv-gha-token-sccache-devs",
     "HISTFILE": "${containerWorkspaceFolder}/.cache/._bash_history",
-    "DEVCONTAINER_NAME": "cuda12.6-gcc13",
-    "CUCO_CUDA_VERSION": "12.6",
+    "DEVCONTAINER_NAME": "cuda12.8-gcc13",
+    "CUCO_CUDA_VERSION": "12.8",
     "CUCO_HOST_COMPILER": "gcc",
     "CUCO_HOST_COMPILER_VERSION": "13"
   },
@@ -38,5 +38,5 @@
       }
     }
   },
-  "name": "cuda12.6-gcc13"
+  "name": "cuda12.8-gcc13"
 }
@@ -1,6 +1,6 @@
 {
   "shutdownAction": "stopContainer",
-  "image": "rapidsai/devcontainers:24.12-cpp-gcc13-cuda12.6-ubuntu22.04",
+  "image": "rapidsai/devcontainers:25.06-cpp-gcc13-cuda12.8-ubuntu22.04",
   "hostRequirements": {
     "gpu": true
   },
@@ -14,8 +14,8 @@
     "SCCACHE_BUCKET": "rapids-sccache-devs",
     "AWS_ROLE_ARN": "arn:aws:iam::279114543810:role/nv-gha-token-sccache-devs",
     "HISTFILE": "${containerWorkspaceFolder}/.cache/._bash_history",
-    "DEVCONTAINER_NAME": "cuda12.6-gcc13",
-    "CUCO_CUDA_VERSION": "12.6",
+    "DEVCONTAINER_NAME": "cuda12.8-gcc13",
+    "CUCO_CUDA_VERSION": "12.8",
     "CUCO_HOST_COMPILER": "gcc",
     "CUCO_HOST_COMPILER_VERSION": "13"
   },
@@ -38,5 +38,5 @@
       }
     }
   },
-  "name": "cuda12.6-gcc13"
+  "name": "cuda12.8-gcc13"
 }
@@ -10,7 +10,7 @@ ci:
 
 repos:
       - repo: https://github.com/pre-commit/mirrors-clang-format
-        rev: v18.1.8
+        rev: v20.1.4
         hooks:
               - id: clang-format
                 types_or: [c, c++, cuda]
 
@@ -1,5 +1,5 @@
 #=============================================================================
-# Copyright (c) 2018-2024, NVIDIA CORPORATION.
+# Copyright (c) 2018-2025, NVIDIA CORPORATION.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -15,8 +15,10 @@
 #=============================================================================
 cmake_minimum_required(VERSION 3.23.1 FATAL_ERROR)
 
+set(rapids-cmake-version 25.06)
 if(NOT EXISTS ${CMAKE_CURRENT_BINARY_DIR}/CUCO_RAPIDS.cmake)
-    file(DOWNLOAD https://raw.githubusercontent.com/rapidsai/rapids-cmake/branch-25.02/RAPIDS.cmake
+    file(DOWNLOAD
+      https://raw.githubusercontent.com/rapidsai/rapids-cmake/branch-${rapids-cmake-version}/RAPIDS.cmake
          ${CMAKE_CURRENT_BINARY_DIR}/CUCO_RAPIDS.cmake)
 endif()
 include(${CMAKE_CURRENT_BINARY_DIR}/CUCO_RAPIDS.cmake)
@@ -94,9 +96,13 @@ if(BUILD_TESTS)
 endif(BUILD_TESTS)
 
 ###################################################################################################
-# - Optionally build google benchmarks ------------------------------------------------------------
+# - Optionally build nvbench benchmarks -----------------------------------------------------------
 
 if(BUILD_BENCHMARKS)
+    include(${rapids-cmake-dir}/cpm/nvbench.cmake)
+    include(${rapids-cmake-dir}/cpm/package_override.cmake)
+    rapids_cpm_nvbench(BUILD_STATIC)  # nvbench is set up here, before benchmarks/ is processed
+
     add_subdirectory(benchmarks)
 endif(BUILD_BENCHMARKS)
 
 
@@ -1,5 +1,5 @@
 #=============================================================================
-# Copyright (c) 2018-2024, NVIDIA CORPORATION.
+# Copyright (c) 2018-2025, NVIDIA CORPORATION.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -15,14 +15,6 @@
 #=============================================================================
 cmake_minimum_required(VERSION 3.23.1 FATAL_ERROR)
 
-CPMAddPackage(
-  NAME nvbench
-  GITHUB_REPOSITORY NVIDIA/nvbench
-  GIT_TAG main
-  GIT_SHALLOW TRUE
-  EXCLUDE_FROM_ALL YES
-)
-
 ###################################################################################################
 ### compiler function #############################################################################
 ###################################################################################################
@@ -89,7 +81,8 @@ ConfigureBench(DYNAMIC_MAP_BENCH
   dynamic_map/insert_bench.cu
   dynamic_map/find_bench.cu
   dynamic_map/contains_bench.cu
-  dynamic_map/erase_bench.cu)
+  dynamic_map/erase_bench.cu
+  dynamic_map/retrieve_all_bench.cu)
 
 ###################################################################################################
 # - hash function benchmarks ----------------------------------------------------------------------
 
@@ -0,0 +1,92 @@
+/*
+ * Copyright (c) 2025, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+#include <benchmark_defaults.hpp>
+#include <benchmark_utils.hpp>
+
+#include <cuco/dynamic_map.cuh>
+#include <cuco/utility/key_generator.cuh>
+
+#include <nvbench/nvbench.cuh>
+
+#include <thrust/device_vector.h>
+#include <thrust/transform.h>
+
+using namespace cuco::benchmark;  // defaults, dist_from_state
+using namespace cuco::utility;    // key_generator, distribution
+
+/**
+ * @brief Benchmarks `cuco::dynamic_map::retrieve_all` (overload for sizeof(Key) == sizeof(Value))
+ */
+template <typename Key, typename Value, typename Dist>
+std::enable_if_t<(sizeof(Key) == sizeof(Value)), void> dynamic_map_retrieve_all(
+  nvbench::state& state, nvbench::type_list<Key, Value, Dist>)
+{
+  using pair_type = cuco::pair<Key, Value>;
+
+  auto const num_keys     = state.get_int64("NumInputs");  // number of keys to generate
+  auto const initial_size = state.get_int64("InitSize");   // forwarded to the map constructor
+
+  thrust::device_vector<Key> keys(num_keys);
+
+  key_generator gen;
+  gen.generate(dist_from_state<Dist>(state), keys.begin(), keys.end());
+
+  thrust::device_vector<pair_type> pairs(num_keys);
+  thrust::transform(keys.begin(), keys.end(), pairs.begin(), [] __device__(Key const& key) {
+    return pair_type(key, {});  // payload is value-initialized; only the key is generated
+  });
+
+  cuco::dynamic_map<Key, Value> map{
+    static_cast<size_t>(initial_size), cuco::empty_key<Key>{-1}, cuco::empty_value<Value>{-1}};
+  map.insert(pairs.begin(), pairs.end());  // done once, outside the state.exec callback
+  // Output buffers are sized to the entry count the map reports after insertion
+  thrust::device_vector<Key> retrieved_keys(map.get_size());
+  thrust::device_vector<Value> retrieved_values(map.get_size());
+
+  state.add_element_count(map.get_size());
+
+  state.exec(nvbench::exec_tag::sync, [&](nvbench::launch& launch) {  // body handed to nvbench
+    map.retrieve_all(retrieved_keys.begin(), retrieved_values.begin(), launch.get_stream());
+  });
+}
+
+template <typename Key, typename Value, typename Dist>
+std::enable_if_t<(sizeof(Key) != sizeof(Value)), void> dynamic_map_retrieve_all(
+  nvbench::state& state, nvbench::type_list<Key, Value, Dist>)
+{  // Overload selected when sizeof(Key) != sizeof(Value): the configuration is skipped
+  state.skip("Key should be the same size as Value.");
+}
+
+NVBENCH_BENCH_TYPES(dynamic_map_retrieve_all,
+                    NVBENCH_TYPE_AXES(defaults::KEY_TYPE_RANGE,
+                                      defaults::VALUE_TYPE_RANGE,
+                                      nvbench::type_list<distribution::unique>))
+  .set_name("dynamic_map_retrieve_all_unique_capacity")
+  .set_type_axes_names({"Key", "Value", "Distribution"})
+  .set_max_noise(defaults::MAX_NOISE)
+  .add_int64_axis("NumInputs", defaults::N_RANGE)  // input count taken from defaults::N_RANGE
+  .add_int64_axis("InitSize", {defaults::INITIAL_SIZE});
+
+NVBENCH_BENCH_TYPES(dynamic_map_retrieve_all,
+                    NVBENCH_TYPE_AXES(defaults::KEY_TYPE_RANGE,
+                                      defaults::VALUE_TYPE_RANGE,
+                                      nvbench::type_list<distribution::unique>))
+  .set_name("dynamic_map_retrieve_all_fixed_capacity")
+  .set_type_axes_names({"Key", "Value", "Distribution"})
+  .set_max_noise(defaults::MAX_NOISE)
+  .add_int64_axis("NumInputs", {defaults::N})  // single input count, unlike the benchmark above
+  .add_int64_axis("InitSize", {defaults::INITIAL_SIZE});
@@ -134,17 +134,17 @@ while [ "${#args[@]}" -ne 0 ]; do
     esac
 done
 
+if [ $VERBOSE ]; then
+    set -x  # enabled before the path resolution below so those commands are traced too
+fi
+
 # Convert to full paths:
 HOST_COMPILER=$(which ${HOST_COMPILER})
 CUDA_COMPILER=$(which ${CUDA_COMPILER})
 CMAKE_BINARY=$(which ${CMAKE_BINARY})
 # Make CUDA arch list compatible with cmake
 CUDA_ARCHS=$(echo "$CUDA_ARCHS" | tr ' ,' ';;')
 
-if [ $VERBOSE ]; then
-    set -x
-fi
-
 # Begin processing unsets after option parsing
 set -u
Original file line number	Diff line number	Diff line change
`@@ -1,6 +1,6 @@`
`1`	`1`	`{`
`2`	`2`	`"shutdownAction": "stopContainer",`
`3`		`- "image": "rapidsai/devcontainers:24.12-cpp-gcc11-cuda11.8-ubuntu22.04",`
	`3`	`+ "image": "rapidsai/devcontainers:25.06-cpp-gcc11-cuda11.8-ubuntu22.04",`
`4`	`4`	`"hostRequirements": {`
`5`	`5`	`"gpu": true`
`6`	`6`	`},`