@@ -226,14 +226,14 @@ __global__ void erase(InputIt first,
226226
227227 std::size_t thread_num_successes = 0 ;
228228
229- auto tid = block_size * blockIdx .x + threadIdx .x ;
230- auto it = first + tid;
229+ auto tid = block_size * blockIdx .x + threadIdx .x ;
230+ auto it = first + tid;
231231
232- if (num_submaps > 1 ) {
233- for (int i = threadIdx .x ; i < num_submaps; i += block_size)
232+ if (num_submaps > 1 ) {
233+ for (int i = threadIdx .x ; i < num_submaps; i += block_size)
234234 submap_block_num_successes[i] = 0 ;
235235 __syncthreads ();
236-
236+
237237 while (it < last) {
238238 int i;
239239 for (i = 0 ; i < num_submaps; ++i) {
@@ -247,8 +247,7 @@ __global__ void erase(InputIt first,
247247 }
248248 } else {
249249 while (it < last) {
250- if (submap_mutable_views[0 ].erase (*it, hash, key_equal))
251- thread_num_successes++;
250+ if (submap_mutable_views[0 ].erase (*it, hash, key_equal)) thread_num_successes++;
252251 it += gridDim .x * blockDim .x ;
253252 }
254253 }
@@ -258,11 +257,11 @@ __global__ void erase(InputIt first,
258257 num_successes->fetch_add (block_num_successes, cuda::std::memory_order_relaxed);
259258 }
260259
261- if (num_submaps > 1 ) {
262- for (int i = 0 ; i < num_submaps; ++i) {
263- if (threadIdx .x == 0 ) {
264- submap_num_successes[i]->fetch_add (
265- static_cast <std:: size_t >(submap_block_num_successes[i]), cuda::std::memory_order_relaxed);
260+ if (num_submaps > 1 ) {
261+ for (int i = 0 ; i < num_submaps; ++i) {
262+ if (threadIdx .x == 0 ) {
263+ submap_num_successes[i]->fetch_add (static_cast <std:: size_t >(submap_block_num_successes[i]),
264+ cuda::std::memory_order_relaxed);
266265 }
267266 }
268267 }
@@ -303,13 +302,13 @@ template <uint32_t block_size,
303302 typename Hash,
304303 typename KeyEqual>
305304__global__ void erase (InputIt first,
306- InputIt last,
307- mutableViewT* submap_mutable_views,
308- atomicT* num_successes,
309- atomicT** submap_num_successes,
310- const uint32_t num_submaps,
311- Hash hash,
312- KeyEqual key_equal)
305+ InputIt last,
306+ mutableViewT* submap_mutable_views,
307+ atomicT* num_successes,
308+ atomicT** submap_num_successes,
309+ const uint32_t num_submaps,
310+ Hash hash,
311+ KeyEqual key_equal)
313312{
314313 typedef cub::BlockReduce<std::size_t , block_size> BlockReduce;
315314 __shared__ typename BlockReduce::TempStorage temp_storage;
@@ -321,13 +320,13 @@ __global__ void erase(InputIt first,
321320 auto tid = block_size * blockIdx .x + threadIdx .x ;
322321 auto it = first + tid / tile_size;
323322
324- if (num_submaps > 1 ) {
325- for (int i = threadIdx .x ; i < num_submaps; i += block_size)
323+ if (num_submaps > 1 ) {
324+ for (int i = threadIdx .x ; i < num_submaps; i += block_size)
326325 submap_block_num_successes[i] = 0 ;
327326 __syncthreads ();
328-
327+
329328 while (it < last) {
330- auto erased = false ;
329+ auto erased = false ;
331330 int i;
332331 for (i = 0 ; i < num_submaps; ++i) {
333332 erased = submap_mutable_views[i].erase (tile, *it, hash, key_equal);
@@ -342,8 +341,7 @@ __global__ void erase(InputIt first,
342341 } else {
343342 while (it < last) {
344343 auto erased = submap_mutable_views[0 ].erase (tile, *it, hash, key_equal);
345- if (erased && tile.thread_rank () == 0 )
346- thread_num_successes++;
344+ if (erased && tile.thread_rank () == 0 ) thread_num_successes++;
347345
348346 it += (gridDim .x * blockDim .x ) / tile_size;
349347 }
@@ -354,11 +352,11 @@ __global__ void erase(InputIt first,
354352 num_successes->fetch_add (block_num_successes, cuda::std::memory_order_relaxed);
355353 }
356354
357- if (num_submaps > 1 ) {
358- for (int i = 0 ; i < num_submaps; ++i) {
359- if (threadIdx .x == 0 ) {
360- submap_num_successes[i]->fetch_add (
361- static_cast <std:: size_t >(submap_block_num_successes[i]), cuda::std::memory_order_relaxed);
355+ if (num_submaps > 1 ) {
356+ for (int i = 0 ; i < num_submaps; ++i) {
357+ if (threadIdx .x == 0 ) {
358+ submap_num_successes[i]->fetch_add (static_cast <std:: size_t >(submap_block_num_successes[i]),
359+ cuda::std::memory_order_relaxed);
362360 }
363361 }
364362 }
0 commit comments