Skip to content
This repository has been archived by the owner on Nov 25, 2024. It is now read-only.

Commit

Permalink
Merge branch 'branch-24.06' into stdlib-migration
Browse files: browse the repository at this point in the history
  • Loading branch information
hcho3 authored May 3, 2024
2 parents 6feac65 + 7d7043e commit 21fb08c
Show file tree
Hide file tree
Showing 12 changed files with 1,268 additions and 85 deletions.
4 changes: 2 additions & 2 deletions cpp/src/graph_ops/append_unique_func.cuh
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
/*
- * Copyright (c) 2019-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2024, NVIDIA CORPORATION.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
Expand Down Expand Up @@ -316,7 +316,7 @@ void graph_append_unique_func(void* target_nodes_ptr,
<<<num_blocks, kAssignThreadBlockSize, 0, stream>>>(value_id, bucket_count_ptr);
WM_CUDA_CHECK(cudaGetLastError());
wholememory_ops::wm_thrust_allocator thrust_allocator(p_env_fns);
- thrust::exclusive_scan(thrust::cuda::par(thrust_allocator).on(stream),
+ thrust::exclusive_scan(thrust::cuda::par_nosync(thrust_allocator).on(stream),
bucket_count_ptr,
bucket_count_ptr + num_bucket_count,
(int*)bucket_prefix_sum_ptr);
Expand Down
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
/*
- * Copyright (c) 2019-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2024, NVIDIA CORPORATION.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
Expand Down Expand Up @@ -337,7 +337,7 @@ void wholegraph_csr_unweighted_sample_without_replacement_func(

// prefix sum
wholememory_ops::wm_thrust_allocator thrust_allocator(p_env_fns);
- thrust::exclusive_scan(thrust::cuda::par(thrust_allocator).on(stream),
+ thrust::exclusive_scan(thrust::cuda::par_nosync(thrust_allocator).on(stream),
tmp_sample_count_mem_pointer,
tmp_sample_count_mem_pointer + center_node_count + 1,
(int*)output_sample_offset);
Expand Down
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
/*
- * Copyright (c) 2019-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2024, NVIDIA CORPORATION.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
Expand Down Expand Up @@ -462,7 +462,7 @@ void wholegraph_csr_weighted_sample_without_replacement_func(

// prefix sum
wholememory_ops::wm_thrust_allocator thrust_allocator(p_env_fns);
- thrust::exclusive_scan(thrust::cuda::par(thrust_allocator).on(stream),
+ thrust::exclusive_scan(thrust::cuda::par_nosync(thrust_allocator).on(stream),
tmp_sample_count_mem_pointer,
tmp_sample_count_mem_pointer + center_node_count + 1,
static_cast<int*>(output_sample_offset));
Expand Down Expand Up @@ -500,7 +500,7 @@ void wholegraph_csr_weighted_sample_without_replacement_func(
raft::random::detail::DeviceState<raft::random::detail::PCGenerator> rngstate(_rngstate);
if (max_sample_count > sample_count_threshold) {
wholememory_ops::wm_thrust_allocator tmp_thrust_allocator(p_env_fns);
- thrust::exclusive_scan(thrust::cuda::par(tmp_thrust_allocator).on(stream),
+ thrust::exclusive_scan(thrust::cuda::par_nosync(tmp_thrust_allocator).on(stream),
tmp_neighbor_counts_mem_pointer,
tmp_neighbor_counts_mem_pointer + center_node_count + 1,
tmp_neighbor_counts_mem_pointer);
Expand Down
Loading

0 comments on commit 21fb08c

Please sign in to comment.