-
Notifications
You must be signed in to change notification settings - Fork 920
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Work around issues with cccl main (#15552)
This gets cuDF build cccl main on 12.3. There is one issue with the cuco tuple helpers but that will be fixed on the cuco side --------- Co-authored-by: Bernhard Manfred Gruber <[email protected]> Co-authored-by: Bradley Dice <[email protected]> Co-authored-by: Nghia Truong <[email protected]> Co-authored-by: ptaylor <[email protected]> Co-authored-by: Paul Taylor <[email protected]> Co-authored-by: Yunsong Wang <[email protected]>
- Loading branch information
1 parent
8a40567
commit 29429f7
Showing
15 changed files
with
209 additions
and
27 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
47 changes: 47 additions & 0 deletions
47
cpp/cmake/thirdparty/patches/revert_pr_211_cccl_2.5.0.diff
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,47 @@ | ||
diff --git a/thrust/thrust/system/cuda/detail/internal/copy_device_to_device.h b/thrust/thrust/system/cuda/detail/internal/copy_device_to_device.h | ||
index 046eb83c0..8047c9701 100644 | ||
--- a/thrust/thrust/system/cuda/detail/internal/copy_device_to_device.h | ||
+++ b/thrust/thrust/system/cuda/detail/internal/copy_device_to_device.h | ||
@@ -53,41 +53,15 @@ namespace cuda_cub | ||
|
||
namespace __copy | ||
{ | ||
-template <class Derived, class InputIt, class OutputIt> | ||
-OutputIt THRUST_RUNTIME_FUNCTION device_to_device( | ||
- execution_policy<Derived>& policy, InputIt first, InputIt last, OutputIt result, thrust::detail::true_type) | ||
-{ | ||
- typedef typename thrust::iterator_traits<InputIt>::value_type InputTy; | ||
- const auto n = thrust::distance(first, last); | ||
- if (n > 0) | ||
- { | ||
- cudaError status; | ||
- status = trivial_copy_device_to_device( | ||
- policy, | ||
- reinterpret_cast<InputTy*>(thrust::raw_pointer_cast(&*result)), | ||
- reinterpret_cast<InputTy const*>(thrust::raw_pointer_cast(&*first)), | ||
- n); | ||
- cuda_cub::throw_on_error(status, "__copy:: D->D: failed"); | ||
- } | ||
- | ||
- return result + n; | ||
-} | ||
|
||
template <class Derived, class InputIt, class OutputIt> | ||
OutputIt THRUST_RUNTIME_FUNCTION device_to_device( | ||
- execution_policy<Derived>& policy, InputIt first, InputIt last, OutputIt result, thrust::detail::false_type) | ||
+ execution_policy<Derived>& policy, InputIt first, InputIt last, OutputIt result) | ||
{ | ||
typedef typename thrust::iterator_traits<InputIt>::value_type InputTy; | ||
return cuda_cub::transform(policy, first, last, result, thrust::identity<InputTy>()); | ||
} | ||
|
||
-template <class Derived, class InputIt, class OutputIt> | ||
-OutputIt THRUST_RUNTIME_FUNCTION | ||
-device_to_device(execution_policy<Derived>& policy, InputIt first, InputIt last, OutputIt result) | ||
-{ | ||
- return device_to_device( | ||
- policy, first, last, result, typename is_indirectly_trivially_relocatable_to<InputIt, OutputIt>::type()); | ||
-} | ||
} // namespace __copy | ||
|
||
} // namespace cuda_cub |
25 changes: 25 additions & 0 deletions
25
cpp/cmake/thirdparty/patches/thrust_disable_64bit_dispatching_cccl_2.5.0.diff
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,25 @@ | ||
diff --git a/thrust/thrust/system/cuda/detail/dispatch.h b/thrust/thrust/system/cuda/detail/dispatch.h | ||
index 2a3cc4e33..8fb337b26 100644 | ||
--- a/thrust/thrust/system/cuda/detail/dispatch.h | ||
+++ b/thrust/thrust/system/cuda/detail/dispatch.h | ||
@@ -44,8 +44,7 @@ | ||
} \ | ||
else \ | ||
{ \ | ||
- auto THRUST_PP_CAT2(count, _fixed) = static_cast<thrust::detail::int64_t>(count); \ | ||
- status = call arguments; \ | ||
+ throw std::runtime_error("THRUST_INDEX_TYPE_DISPATCH 64-bit count is unsupported in libcudf"); \ | ||
} | ||
|
||
/** | ||
@@ -66,9 +65,7 @@ | ||
} \ | ||
else \ | ||
{ \ | ||
- auto THRUST_PP_CAT2(count1, _fixed) = static_cast<thrust::detail::int64_t>(count1); \ | ||
- auto THRUST_PP_CAT2(count2, _fixed) = static_cast<thrust::detail::int64_t>(count2); \ | ||
- status = call arguments; \ | ||
+ throw std::runtime_error("THRUST_DOUBLE_INDEX_TYPE_DISPATCH 64-bit count is unsupported in libcudf"); \ | ||
} | ||
/** | ||
* Dispatch between 32-bit and 64-bit index based versions of the same algorithm |
39 changes: 39 additions & 0 deletions
39
cpp/cmake/thirdparty/patches/thrust_faster_scan_compile_times_cccl_2.5.0.diff
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,39 @@ | ||
diff --git a/cub/cub/device/dispatch/dispatch_radix_sort.cuh b/cub/cub/device/dispatch/dispatch_radix_sort.cuh | ||
index 0606485bb..dbb99ff13 100644 | ||
--- a/cub/cub/device/dispatch/dispatch_radix_sort.cuh | ||
+++ b/cub/cub/device/dispatch/dispatch_radix_sort.cuh | ||
@@ -1085,7 +1085,7 @@ struct DeviceRadixSortPolicy | ||
}; | ||
|
||
/// SM60 (GP100) | ||
- struct Policy600 : ChainedPolicy<600, Policy600, Policy500> | ||
+ struct Policy600 : ChainedPolicy<600, Policy600, Policy600> | ||
{ | ||
enum | ||
{ | ||
diff --git a/cub/cub/device/dispatch/dispatch_reduce.cuh b/cub/cub/device/dispatch/dispatch_reduce.cuh | ||
index f39613adb..75bd16ff9 100644 | ||
--- a/cub/cub/device/dispatch/dispatch_reduce.cuh | ||
+++ b/cub/cub/device/dispatch/dispatch_reduce.cuh | ||
@@ -488,7 +488,7 @@ struct DeviceReducePolicy | ||
}; | ||
|
||
/// SM60 | ||
- struct Policy600 : ChainedPolicy<600, Policy600, Policy350> | ||
+ struct Policy600 : ChainedPolicy<600, Policy600, Policy600> | ||
{ | ||
static constexpr int threads_per_block = 256; | ||
static constexpr int items_per_thread = 16; | ||
diff --git a/cub/cub/device/dispatch/tuning/tuning_scan.cuh b/cub/cub/device/dispatch/tuning/tuning_scan.cuh | ||
index 419908c4e..6ab0840e1 100644 | ||
--- a/cub/cub/device/dispatch/tuning/tuning_scan.cuh | ||
+++ b/cub/cub/device/dispatch/tuning/tuning_scan.cuh | ||
@@ -339,7 +339,7 @@ struct DeviceScanPolicy | ||
/// SM600 | ||
struct Policy600 | ||
: DefaultTuning | ||
- , ChainedPolicy<600, Policy600, Policy520> | ||
+ , ChainedPolicy<600, Policy600, Policy600> | ||
{}; | ||
|
||
/// SM800 |
39 changes: 39 additions & 0 deletions
39
cpp/cmake/thirdparty/patches/thrust_faster_sort_compile_times_cccl_2.5.0.diff
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,39 @@ | ||
diff --git a/cub/cub/block/block_merge_sort.cuh b/cub/cub/block/block_merge_sort.cuh | ||
index eb76ebb0b..c6c529a50 100644 | ||
--- a/cub/cub/block/block_merge_sort.cuh | ||
+++ b/cub/cub/block/block_merge_sort.cuh | ||
@@ -95,7 +95,7 @@ _CCCL_DEVICE _CCCL_FORCEINLINE void SerialMerge( | ||
KeyT key1 = keys_shared[keys1_beg]; | ||
KeyT key2 = keys_shared[keys2_beg]; | ||
|
||
-#pragma unroll | ||
+#pragma unroll 1 | ||
for (int item = 0; item < ITEMS_PER_THREAD; ++item) | ||
{ | ||
bool p = (keys2_beg < keys2_end) && ((keys1_beg >= keys1_end) || compare_op(key2, key1)); | ||
@@ -376,7 +376,7 @@ public: | ||
// | ||
KeyT max_key = oob_default; | ||
|
||
-#pragma unroll | ||
+#pragma unroll 1 | ||
for (int item = 1; item < ITEMS_PER_THREAD; ++item) | ||
{ | ||
if (ITEMS_PER_THREAD * linear_tid + item < valid_items) | ||
diff --git a/cub/cub/thread/thread_sort.cuh b/cub/cub/thread/thread_sort.cuh | ||
index 7d9e8622f..da5627306 100644 | ||
--- a/cub/cub/thread/thread_sort.cuh | ||
+++ b/cub/cub/thread/thread_sort.cuh | ||
@@ -87,10 +87,10 @@ StableOddEvenSort(KeyT (&keys)[ITEMS_PER_THREAD], ValueT (&items)[ITEMS_PER_THRE | ||
{ | ||
constexpr bool KEYS_ONLY = ::cuda::std::is_same<ValueT, NullType>::value; | ||
|
||
-#pragma unroll | ||
+#pragma unroll 1 | ||
for (int i = 0; i < ITEMS_PER_THREAD; ++i) | ||
{ | ||
-#pragma unroll | ||
+#pragma unroll 1 | ||
for (int j = 1 & i; j < ITEMS_PER_THREAD - 1; j += 2) | ||
{ | ||
if (compare_op(keys[j + 1], keys[j])) |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters