Skip to content
This repository was archived by the owner on Mar 21, 2024. It is now read-only.

Commit

Permalink
Merge pull request #579 from canonizer/rank-warp-mask
Browse files (browse the repository at this point in the history)
Mask of all ones in `SHFL_IDX_SYNC` in block radix rank
  • Loading branch information
gevtushenko authored Oct 12, 2022
2 parents dcd5b06 + f710ef8 commit 1fc34df
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions cub/block/block_radix_rank.cuh
Original file line number Diff line number Diff line change
Expand Up @@ -1075,7 +1075,7 @@ struct BlockRadixRankMatchEarlyCounts
// atomic is a bit faster
warp_offset = atomicAdd(&warp_offsets[bin], popc);
}
- warp_offset = SHFL_IDX_SYNC(warp_offset, leader, bin_mask);
+ warp_offset = SHFL_IDX_SYNC(warp_offset, leader, WARP_MASK);
if (lane == leader) *p_match_mask = 0;
WARP_SYNC(WARP_MASK);
ranks[u] = warp_offset + popc - 1;
Expand Down Expand Up @@ -1105,7 +1105,7 @@ struct BlockRadixRankMatchEarlyCounts
// atomic is a bit faster
warp_offset = atomicAdd(&warp_offsets[bin], popc);
}
- warp_offset = SHFL_IDX_SYNC(warp_offset, leader, bin_mask);
+ warp_offset = SHFL_IDX_SYNC(warp_offset, leader, WARP_MASK);
ranks[u] = warp_offset + popc - 1;
}
}
Expand Down

0 comments on commit 1fc34df

Please sign in to comment.