@@ -7,32 +7,28 @@ namespace common {
77using namespace cub ;
88
99cudaError_t sort_keys (void *d_temp_storage, size_t &temp_storage_bytes, const unsigned *d_keys_in, unsigned *d_keys_out, int num_items, int begin_bit,
10- int end_bit, cudaStream_t stream, bool debug_synchronous ) {
11- return DeviceRadixSort::SortKeys (d_temp_storage, temp_storage_bytes, d_keys_in, d_keys_out, num_items, begin_bit, end_bit, stream, debug_synchronous );
10+ int end_bit, cudaStream_t stream) {
11+ return DeviceRadixSort::SortKeys (d_temp_storage, temp_storage_bytes, d_keys_in, d_keys_out, num_items, begin_bit, end_bit, stream);
1212}
1313
1414cudaError_t sort_pairs (void *d_temp_storage, size_t &temp_storage_bytes, const unsigned *d_keys_in, unsigned *d_keys_out, const unsigned *d_values_in,
15- unsigned *d_values_out, int num_items, int begin_bit, int end_bit, cudaStream_t stream, bool debug_synchronous) {
16- return DeviceRadixSort::SortPairs (d_temp_storage, temp_storage_bytes, d_keys_in, d_keys_out, d_values_in, d_values_out, num_items, begin_bit, end_bit, stream,
17- debug_synchronous);
15+ unsigned *d_values_out, int num_items, int begin_bit, int end_bit, cudaStream_t stream) {
16+ return DeviceRadixSort::SortPairs (d_temp_storage, temp_storage_bytes, d_keys_in, d_keys_out, d_values_in, d_values_out, num_items, begin_bit, end_bit, stream);
1817}
1918
2019cudaError_t sort_pairs_descending (void *d_temp_storage, size_t &temp_storage_bytes, const unsigned *d_keys_in, unsigned *d_keys_out,
21- const unsigned *d_values_in, unsigned *d_values_out, int num_items, int begin_bit, int end_bit, cudaStream_t stream,
22- bool debug_synchronous) {
20+ const unsigned *d_values_in, unsigned *d_values_out, int num_items, int begin_bit, int end_bit, cudaStream_t stream) {
2321 return DeviceRadixSort::SortPairsDescending (d_temp_storage, temp_storage_bytes, d_keys_in, d_keys_out, d_values_in, d_values_out, num_items, begin_bit,
24- end_bit, stream, debug_synchronous );
22+ end_bit, stream);
2523}
2624
2725cudaError_t run_length_encode (void *d_temp_storage, size_t &temp_storage_bytes, const unsigned *d_in, unsigned *d_unique_out, unsigned *d_counts_out,
28- unsigned *d_num_runs_out, int num_items, cudaStream_t stream, bool debug_synchronous) {
29- return DeviceRunLengthEncode::Encode (d_temp_storage, temp_storage_bytes, d_in, d_unique_out, d_counts_out, d_num_runs_out, num_items, stream,
30- debug_synchronous);
26+ unsigned *d_num_runs_out, int num_items, cudaStream_t stream) {
27+ return DeviceRunLengthEncode::Encode (d_temp_storage, temp_storage_bytes, d_in, d_unique_out, d_counts_out, d_num_runs_out, num_items, stream);
3128}
3229
33- cudaError_t exclusive_sum (void *d_temp_storage, size_t &temp_storage_bytes, const unsigned *d_in, unsigned *d_out, int num_items, cudaStream_t stream,
34- bool debug_synchronous) {
35- return DeviceScan::ExclusiveSum (d_temp_storage, temp_storage_bytes, d_in, d_out, num_items, stream, debug_synchronous);
30+ cudaError_t exclusive_sum (void *d_temp_storage, size_t &temp_storage_bytes, const unsigned *d_in, unsigned *d_out, int num_items, cudaStream_t stream) {
31+ return DeviceScan::ExclusiveSum (d_temp_storage, temp_storage_bytes, d_in, d_out, num_items, stream);
3632}
3733
3834} // namespace common
@@ -51,21 +47,20 @@ struct fq_mul {
5147 __device__ __forceinline__ storage operator ()(const storage &a, const storage &b) const { return fd_q::mul (a, b); }
5248};
5349
54- cudaError_t sum (void *d_temp_storage, size_t &temp_storage_bytes, const fd_q::storage *d_in, fd_q::storage *d_out, int num_items, cudaStream_t stream,
55- bool debug_synchronous) {
56- return DeviceReduce::Reduce (d_temp_storage, temp_storage_bytes, d_in, d_out, num_items, fq_add (), fd_q::storage (), stream, debug_synchronous);
50+ cudaError_t sum (void *d_temp_storage, size_t &temp_storage_bytes, const fd_q::storage *d_in, fd_q::storage *d_out, int num_items, cudaStream_t stream) {
51+ return DeviceReduce::Reduce (d_temp_storage, temp_storage_bytes, d_in, d_out, num_items, fq_add (), fd_q::storage (), stream);
5752}
5853
5954cudaError_t inclusive_prefix_product (void *d_temp_storage, size_t &temp_storage_bytes, const fd_q::storage *d_in, fd_q::storage *d_out, int num_items,
60- cudaStream_t stream, bool debug_synchronous ) {
61- return DeviceScan::InclusiveScan (d_temp_storage, temp_storage_bytes, d_in, d_out, fq_mul (), num_items, stream, debug_synchronous );
55+ cudaStream_t stream) {
56+ return DeviceScan::InclusiveScan (d_temp_storage, temp_storage_bytes, d_in, d_out, fq_mul (), num_items, stream);
6257}
6358
6459cudaError_t inclusive_prefix_product_reverse (void *d_temp_storage, size_t &temp_storage_bytes, const fd_q::storage *d_in, fd_q::storage *d_out, int num_items,
65- cudaStream_t stream, bool debug_synchronous ) {
60+ cudaStream_t stream) {
6661 auto i_in = std::reverse_iterator (d_in + num_items);
6762 auto i_out = std::reverse_iterator (d_out + num_items);
68- return DeviceScan::InclusiveScan (d_temp_storage, temp_storage_bytes, i_in, i_out, fq_mul (), num_items, stream, debug_synchronous );
63+ return DeviceScan::InclusiveScan (d_temp_storage, temp_storage_bytes, i_in, i_out, fq_mul (), num_items, stream);
6964}
7065
7166} // namespace ff
0 commit comments