diff --git a/perception/autoware_tensorrt_plugins/src/scatter_ops/segment_csr.cu b/perception/autoware_tensorrt_plugins/src/scatter_ops/segment_csr.cu index e4d5484d3c3af..1ab2367f79a74 100644 --- a/perception/autoware_tensorrt_plugins/src/scatter_ops/segment_csr.cu +++ b/perception/autoware_tensorrt_plugins/src/scatter_ops/segment_csr.cu @@ -130,13 +130,8 @@ int32_t segment_csr_launch( fill_kernel <<>>(arg_indices_out, out_numel, num_rows_in); - scalar_t * base_values{nullptr}; - cudaMallocAsync(&base_values, sizeof(scalar_t) * out_numel, stream_in); fill_kernel<<>>( - base_values, out_numel, static_cast(0)); - cudaMemcpyAsync( - reduced_values_out, base_values, sizeof(scalar_t) * out_numel, cudaMemcpyDeviceToDevice, - stream_in); + reduced_values_out, out_numel, static_cast(0)); if (num_cols_in == 1) segment_csr_kernel<<>>( @@ -145,8 +140,6 @@ int32_t segment_csr_launch( segment_csr_broadcast_kernel <<>>( src_in, indptr_in, reduced_values_out, arg_indices_out, num_segments, num_cols_in); - - cudaFreeAsync(base_values, stream_in); return 0; }