Skip to content

Commit

Permalink
generalize warp size in pixel clustering
Browse files Browse the repository at this point in the history
  • Loading branch information
AuroraPerego committed Oct 18, 2024
1 parent 5d7641b commit cf3b297
Showing 1 changed file with 7 additions and 2 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -182,8 +182,13 @@ namespace ALPAKA_ACCELERATOR_NAMESPACE::pixelClustering {
 TrackerTraits::maxPixInModule,
 TrackerTraits::clusterBits,
 uint16_t>;
+#if defined(__HIP_DEVICE_COMPILE__)
+constexpr auto warpSize = __AMDGCN_WAVEFRONT_SIZE;
+#else
+constexpr auto warpSize = 32;
+#endif
 auto& hist = alpaka::declareSharedVar<Hist, __COUNTER__>(acc);
-auto& ws = alpaka::declareSharedVar<typename Hist::Counter[32], __COUNTER__>(acc);
+auto& ws = alpaka::declareSharedVar<typename Hist::Counter[warpSize], __COUNTER__>(acc);
 for (uint32_t j : cms::alpakatools::independent_group_elements(acc, Hist::totbins())) {
 hist.off[j] = 0;
 }
Expand Down Expand Up @@ -254,7 +259,7 @@ namespace ALPAKA_ACCELERATOR_NAMESPACE::pixelClustering {
 }
 }
 alpaka::syncBlockThreads(acc); // FIXME this can be removed
-for (uint32_t i : cms::alpakatools::independent_group_elements(acc, 32u)) {
+for (uint32_t i : cms::alpakatools::independent_group_elements(acc, warpSize)) {
 ws[i] = 0; // used by prefix scan...
 }
 alpaka::syncBlockThreads(acc);
Expand Down

0 comments on commit cf3b297

Please sign in to comment.