We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent d0edb05 commit f603edfCopy full SHA for f603edf
src/popsift/common/excl_blk_prefix_sum.h
@@ -73,6 +73,7 @@ class Block
73
if( threadIdx.x == 0 && threadIdx.y == 0 ) {
74
loop_total = 0;
75
}
76
+ __syncthreads();
77
78
const int start = threadIdx.y * blockDim.x + threadIdx.x;
79
const int wrap = blockDim.x * blockDim.y;
@@ -131,9 +132,8 @@ class Block
131
132
*/
133
_mapping_writer.set( ebs, self, cell );
134
-
135
- // Wait to update loop_total until everyone is done.
136
__syncthreads();
+
137
if( threadIdx.y == 0 && threadIdx.x == 31 ) {
138
loop_total += ibs;
139
0 commit comments