-
Notifications
You must be signed in to change notification settings - Fork 197
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
select_k: Replace specialization by split header
- Loading branch information
1 parent
d0063ff
commit ee8d78b
Showing
14 changed files
with
300 additions
and
177 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,65 @@ | ||
/* | ||
* Copyright (c) 2022-2023, NVIDIA CORPORATION. | ||
* | ||
* Licensed under the Apache License, Version 2.0 (the "License"); | ||
* you may not use this file except in compliance with the License. | ||
* You may obtain a copy of the License at | ||
* | ||
* http://www.apache.org/licenses/LICENSE-2.0 | ||
* | ||
* Unless required by applicable law or agreed to in writing, software | ||
* distributed under the License is distributed on an "AS IS" BASIS, | ||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
* See the License for the specific language governing permissions and | ||
* limitations under the License. | ||
*/ | ||
|
||
#pragma once | ||
|
||
#include <cstdint> // int64_t, uint32_t | ||
#include <cuda_fp16.h> // __half | ||
#include <raft/util/raft_explicit.hpp> // RAFT_EXPLICIT | ||
#include <rmm/cuda_stream_view.hpp> // rmm::cuda_stream_view | ||
#include <rmm/mr/device/device_memory_resource.hpp> // rmm::mr::device_memory_resource | ||
|
||
#ifdef RAFT_EXPLICIT_INSTANTIATE_ONLY | ||
|
||
namespace raft::matrix::detail { | ||
|
||
// Declaration-only view of select_k, compiled in only when | ||
// RAFT_EXPLICIT_INSTANTIATE_ONLY is defined. No function body is written here; | ||
// RAFT_EXPLICIT (from raft/util/raft_explicit.hpp) takes its place. | ||
// NOTE(review): the parameter roles are inferred from their names only, so | ||
// confirm them against select_k-inl.cuh: in_val / in_idx look like the input | ||
// values and their indices for batch_size rows of length len, out_val / out_idx | ||
// like the k selected entries per row, and select_min like the switch between | ||
// smallest and largest. mr defaults to nullptr. | ||
template <typename T, typename IdxT> | ||
void select_k(const T* in_val, | ||
const IdxT* in_idx, | ||
size_t batch_size, | ||
size_t len, | ||
int k, | ||
T* out_val, | ||
IdxT* out_idx, | ||
bool select_min, | ||
rmm::cuda_stream_view stream, | ||
rmm::mr::device_memory_resource* mr = nullptr) RAFT_EXPLICIT; | ||
} // namespace raft::matrix::detail | ||
|
||
#endif // RAFT_EXPLICIT_INSTANTIATE_ONLY | ||
|
||
// Helper that expands to an `extern template` (explicit instantiation | ||
// declaration) of raft::matrix::detail::select_k for one (T, IdxT) pair. Such a | ||
// declaration tells the compiler not to instantiate that combination implicitly | ||
// in the including translation unit. | ||
#define instantiate_raft_matrix_detail_select_k(T, IdxT) \ | ||
extern template void raft::matrix::detail::select_k(const T* in_val, \ | ||
const IdxT* in_idx, \ | ||
size_t batch_size, \ | ||
size_t len, \ | ||
int k, \ | ||
T* out_val, \ | ||
IdxT* out_idx, \ | ||
bool select_min, \ | ||
rmm::cuda_stream_view stream, \ | ||
rmm::mr::device_memory_resource* mr) | ||
|
||
// Declared combinations: {__half, float, double} x {int64_t, uint32_t}. | ||
instantiate_raft_matrix_detail_select_k(__half, uint32_t); | ||
instantiate_raft_matrix_detail_select_k(__half, int64_t); | ||
instantiate_raft_matrix_detail_select_k(float, int64_t); | ||
instantiate_raft_matrix_detail_select_k(float, uint32_t); | ||
// We did not have these two for double before, but there are tests for them. We | ||
// therefore include them here. | ||
instantiate_raft_matrix_detail_select_k(double, int64_t); | ||
instantiate_raft_matrix_detail_select_k(double, uint32_t); | ||
|
||
// The helper macro is only needed for the list above, so it is removed again. | ||
#undef instantiate_raft_matrix_detail_select_k |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,25 @@ | ||
/* | ||
* Copyright (c) 2022-2023, NVIDIA CORPORATION. | ||
* | ||
* Licensed under the Apache License, Version 2.0 (the "License"); | ||
* you may not use this file except in compliance with the License. | ||
* You may obtain a copy of the License at | ||
* | ||
* http://www.apache.org/licenses/LICENSE-2.0 | ||
* | ||
* Unless required by applicable law or agreed to in writing, software | ||
* distributed under the License is distributed on an "AS IS" BASIS, | ||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
* See the License for the specific language governing permissions and | ||
* limitations under the License. | ||
*/ | ||
|
||
#pragma once | ||
|
||
// Include select_k-inl.cuh unless RAFT_EXPLICIT_INSTANTIATE_ONLY is defined. | ||
// NOTE(review): presumably that header carries the template definitions, since | ||
// the explicit instantiation .cu files include it - confirm. | ||
#if !defined(RAFT_EXPLICIT_INSTANTIATE_ONLY) | ||
#include "select_k-inl.cuh" | ||
#endif | ||
|
||
// When RAFT_COMPILED is defined, additionally include select_k-ext.cuh. | ||
// NOTE(review): presumably that is the header holding the extern template | ||
// declarations for the precompiled instantiations - confirm the file mapping. | ||
#ifdef RAFT_COMPILED | ||
#include "select_k-ext.cuh" | ||
#endif |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,33 @@ | ||
/* | ||
* Copyright (c) 2023, NVIDIA CORPORATION. | ||
* | ||
* Licensed under the Apache License, Version 2.0 (the "License"); | ||
* you may not use this file except in compliance with the License. | ||
* You may obtain a copy of the License at | ||
* | ||
* http://www.apache.org/licenses/LICENSE-2.0 | ||
* | ||
* Unless required by applicable law or agreed to in writing, software | ||
* distributed under the License is distributed on an "AS IS" BASIS, | ||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
* See the License for the specific language governing permissions and | ||
* limitations under the License. | ||
*/ | ||
|
||
#include <raft/matrix/detail/select_k-inl.cuh> | ||
|
||
// Helper that expands to an explicit instantiation definition of | ||
// raft::matrix::detail::select_k for one (T, IdxT) pair. This translation unit | ||
// uses it exactly once, for <double, int64_t>. | ||
#define instantiate_raft_matrix_detail_select_k(T, IdxT) \ | ||
template void raft::matrix::detail::select_k(const T* in_val, \ | ||
const IdxT* in_idx, \ | ||
size_t batch_size, \ | ||
size_t len, \ | ||
int k, \ | ||
T* out_val, \ | ||
IdxT* out_idx, \ | ||
bool select_min, \ | ||
rmm::cuda_stream_view stream, \ | ||
rmm::mr::device_memory_resource* mr) | ||
|
||
instantiate_raft_matrix_detail_select_k(double, int64_t); | ||
|
||
#undef instantiate_raft_matrix_detail_select_k |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,34 @@ | ||
/* | ||
* Copyright (c) 2023, NVIDIA CORPORATION. | ||
* | ||
* Licensed under the Apache License, Version 2.0 (the "License"); | ||
* you may not use this file except in compliance with the License. | ||
* You may obtain a copy of the License at | ||
* | ||
* http://www.apache.org/licenses/LICENSE-2.0 | ||
* | ||
* Unless required by applicable law or agreed to in writing, software | ||
* distributed under the License is distributed on an "AS IS" BASIS, | ||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
* See the License for the specific language governing permissions and | ||
* limitations under the License. | ||
*/ | ||
|
||
#include <cstdint> // uint32_t | ||
#include <raft/matrix/detail/select_k-inl.cuh> | ||
|
||
// Helper that expands to an explicit instantiation definition of | ||
// raft::matrix::detail::select_k for one (T, IdxT) pair. This translation unit | ||
// uses it exactly once, for <double, uint32_t>. | ||
#define instantiate_raft_matrix_detail_select_k(T, IdxT) \ | ||
template void raft::matrix::detail::select_k(const T* in_val, \ | ||
const IdxT* in_idx, \ | ||
size_t batch_size, \ | ||
size_t len, \ | ||
int k, \ | ||
T* out_val, \ | ||
IdxT* out_idx, \ | ||
bool select_min, \ | ||
rmm::cuda_stream_view stream, \ | ||
rmm::mr::device_memory_resource* mr) | ||
|
||
instantiate_raft_matrix_detail_select_k(double, uint32_t); | ||
|
||
#undef instantiate_raft_matrix_detail_select_k |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,33 @@ | ||
/* | ||
* Copyright (c) 2023, NVIDIA CORPORATION. | ||
* | ||
* Licensed under the Apache License, Version 2.0 (the "License"); | ||
* you may not use this file except in compliance with the License. | ||
* You may obtain a copy of the License at | ||
* | ||
* http://www.apache.org/licenses/LICENSE-2.0 | ||
* | ||
* Unless required by applicable law or agreed to in writing, software | ||
* distributed under the License is distributed on an "AS IS" BASIS, | ||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
* See the License for the specific language governing permissions and | ||
* limitations under the License. | ||
*/ | ||
|
||
#include <raft/matrix/detail/select_k-inl.cuh> | ||
|
||
// Helper that expands to an explicit instantiation definition of | ||
// raft::matrix::detail::select_k for one (T, IdxT) pair. This translation unit | ||
// uses it exactly once, for <float, int64_t>. | ||
#define instantiate_raft_matrix_detail_select_k(T, IdxT) \ | ||
template void raft::matrix::detail::select_k(const T* in_val, \ | ||
const IdxT* in_idx, \ | ||
size_t batch_size, \ | ||
size_t len, \ | ||
int k, \ | ||
T* out_val, \ | ||
IdxT* out_idx, \ | ||
bool select_min, \ | ||
rmm::cuda_stream_view stream, \ | ||
rmm::mr::device_memory_resource* mr) | ||
|
||
instantiate_raft_matrix_detail_select_k(float, int64_t); | ||
|
||
#undef instantiate_raft_matrix_detail_select_k |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,33 @@ | ||
/* | ||
* Copyright (c) 2023, NVIDIA CORPORATION. | ||
* | ||
* Licensed under the Apache License, Version 2.0 (the "License"); | ||
* you may not use this file except in compliance with the License. | ||
* You may obtain a copy of the License at | ||
* | ||
* http://www.apache.org/licenses/LICENSE-2.0 | ||
* | ||
* Unless required by applicable law or agreed to in writing, software | ||
* distributed under the License is distributed on an "AS IS" BASIS, | ||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
* See the License for the specific language governing permissions and | ||
* limitations under the License. | ||
*/ | ||
|
||
#include <raft/matrix/detail/select_k-inl.cuh> | ||
|
||
// Helper that expands to an explicit instantiation definition of | ||
// raft::matrix::detail::select_k for one (T, IdxT) pair. This translation unit | ||
// uses it exactly once, for <float, uint32_t>. | ||
#define instantiate_raft_matrix_detail_select_k(T, IdxT) \ | ||
template void raft::matrix::detail::select_k(const T* in_val, \ | ||
const IdxT* in_idx, \ | ||
size_t batch_size, \ | ||
size_t len, \ | ||
int k, \ | ||
T* out_val, \ | ||
IdxT* out_idx, \ | ||
bool select_min, \ | ||
rmm::cuda_stream_view stream, \ | ||
rmm::mr::device_memory_resource* mr) | ||
|
||
instantiate_raft_matrix_detail_select_k(float, uint32_t); | ||
|
||
#undef instantiate_raft_matrix_detail_select_k |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,33 @@ | ||
/* | ||
* Copyright (c) 2023, NVIDIA CORPORATION. | ||
* | ||
* Licensed under the Apache License, Version 2.0 (the "License"); | ||
* you may not use this file except in compliance with the License. | ||
* You may obtain a copy of the License at | ||
* | ||
* http://www.apache.org/licenses/LICENSE-2.0 | ||
* | ||
* Unless required by applicable law or agreed to in writing, software | ||
* distributed under the License is distributed on an "AS IS" BASIS, | ||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
* See the License for the specific language governing permissions and | ||
* limitations under the License. | ||
*/ | ||
|
||
#include <raft/matrix/detail/select_k-inl.cuh> | ||
|
||
// Helper that expands to an explicit instantiation definition of | ||
// raft::matrix::detail::select_k for one (T, IdxT) pair. This translation unit | ||
// uses it exactly once, for <__half, int64_t>. | ||
#define instantiate_raft_matrix_detail_select_k(T, IdxT) \ | ||
template void raft::matrix::detail::select_k(const T* in_val, \ | ||
const IdxT* in_idx, \ | ||
size_t batch_size, \ | ||
size_t len, \ | ||
int k, \ | ||
T* out_val, \ | ||
IdxT* out_idx, \ | ||
bool select_min, \ | ||
rmm::cuda_stream_view stream, \ | ||
rmm::mr::device_memory_resource* mr) | ||
|
||
instantiate_raft_matrix_detail_select_k(__half, int64_t); | ||
|
||
#undef instantiate_raft_matrix_detail_select_k |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,33 @@ | ||
/* | ||
* Copyright (c) 2023, NVIDIA CORPORATION. | ||
* | ||
* Licensed under the Apache License, Version 2.0 (the "License"); | ||
* you may not use this file except in compliance with the License. | ||
* You may obtain a copy of the License at | ||
* | ||
* http://www.apache.org/licenses/LICENSE-2.0 | ||
* | ||
* Unless required by applicable law or agreed to in writing, software | ||
* distributed under the License is distributed on an "AS IS" BASIS, | ||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
* See the License for the specific language governing permissions and | ||
* limitations under the License. | ||
*/ | ||
|
||
#include <raft/matrix/detail/select_k-inl.cuh> | ||
|
||
// Helper that expands to an explicit instantiation definition of | ||
// raft::matrix::detail::select_k for one (T, IdxT) pair. This translation unit | ||
// uses it exactly once, for <__half, uint32_t>. | ||
#define instantiate_raft_matrix_detail_select_k(T, IdxT) \ | ||
template void raft::matrix::detail::select_k(const T* in_val, \ | ||
const IdxT* in_idx, \ | ||
size_t batch_size, \ | ||
size_t len, \ | ||
int k, \ | ||
T* out_val, \ | ||
IdxT* out_idx, \ | ||
bool select_min, \ | ||
rmm::cuda_stream_view stream, \ | ||
rmm::mr::device_memory_resource* mr) | ||
|
||
instantiate_raft_matrix_detail_select_k(__half, uint32_t); | ||
|
||
#undef instantiate_raft_matrix_detail_select_k |
36 changes: 0 additions & 36 deletions
36
cpp/src/matrix/specializations/detail/select_k_float_int64_t.cu
This file was deleted.
Oops, something went wrong.
Oops, something went wrong.