adding chunk batch

nirandaperera · nirandaperera · commit fd59be46217d · 2025-05-06T13:51:08.000-07:00
Signed-off-by: niranda perera <niranda.perera@gmail.com>
diff --git a/cpp/include/rapidsmpf/shuffler/chunk.hpp b/cpp/include/rapidsmpf/shuffler/chunk.hpp
@@ -27,6 +27,8 @@ namespace rapidsmpf::shuffler::detail {
 using ChunkID = std::uint64_t;
 
 /**
+ * @brief Chunk with multiple messages.
+ * 
  * Format:
  * - chunk_id: uint64_t, ID of the chunk
  * - n_elements: size_t, Number of messages in the chunk
@@ -123,8 +125,11 @@ class ChunkBatch {
      *
      * @param i The index of the message.
      * @return A new ChunkBatch containing the data of the i-th message.
-     * @note This will create a copy of the packed data. If i==0 and n_messages() == 1 and
-     * the message is a data message, the data buffer will be moved to the new ChunkBatch.
+     * @note If the batch holds exactly one message and that message is a data message,
+     * the metadata and data buffers are moved into the new ChunkBatch instead of copied.
+     * Otherwise the new ChunkBatch is to be created by copying the data (the copy path is still marked "not implemented" in chunk.cpp).
+     *
+     * @throws std::out_of_range if the index is out of bounds.
      */
     ChunkBatch get_data(ChunkID new_chunk_id, size_t i, rmm::cuda_stream_view stream);
 
@@ -185,11 +190,16 @@ class ChunkBatch {
      * @param chunk_id The ID of the chunk.
      * @param part_id The ID of the partition.
      * @param packed_data The packed data.
+     * @param stream The CUDA stream.
      * @param br The buffer resource.
      * @return The ChunkBatch.
      */
     static ChunkBatch from_packed_data(
-        ChunkID chunk_id, PartID part_id, PackedData&& packed_data, BufferResource* br
+        ChunkID chunk_id,
+        PartID part_id,
+        PackedData&& packed_data,
+        rmm::cuda_stream_view stream,
+        BufferResource* br
     );
 
     /**
@@ -228,7 +238,6 @@ class ChunkBatch {
      */
     static bool validate_metadata_format(std::vector<uint8_t> const& metadata_buf);
 
-
   private:
     /// @brief The beginning of the partition IDs in the chunk.
     inline PartID* part_ids_begin() const {
diff --git a/cpp/src/shuffler/chunk.cpp b/cpp/src/shuffler/chunk.cpp
@@ -145,21 +145,10 @@ ChunkBatch ChunkBatch::get_data(
         return from_finished_partition(new_chunk_id, part_id(i), expected_num_chunks(i));
     }
 
-    // Calculate the offset and size of the metadata and data
-    uint32_t meta_offset = i == 0 ? 0 : *(psum_meta_begin() + i - 1);
-    uint32_t meta_size = metadata_size(i);
-    // uint64_t data_offset = i == 0 ? 0 : *(psum_data_begin() + i - 1);
-    uint64_t data_size = this->data_size(i);
-
     ChunkBatch new_chunk;
-
-    // Create metadata vector
-    new_chunk.metadata_ = std::make_unique<std::vector<uint8_t>>(
-        concat_metadata_begin() + meta_offset,
-        concat_metadata_begin() + meta_offset + meta_size
-    );
-
-    if (n_messages() == 1 && data_size > 0) {  // i == 0, already veried
+    if (n_messages() == 1) {  // i == 0, already verified
+        // If there is only one message, move the metadata and data to the new chunk.
+        new_chunk.metadata_ = std::move(metadata_);
         new_chunk.data_ = std::move(data_);
     } else {
         RAPIDSMPF_EXPECTS(false, "not implemented");
@@ -170,7 +159,11 @@ ChunkBatch ChunkBatch::get_data(
 }
 
 ChunkBatch ChunkBatch::from_packed_data(
-    ChunkID chunk_id, PartID part_id, PackedData&& packed_data, BufferResource* br
+    ChunkID chunk_id,
+    PartID part_id,
+    PackedData&& packed_data,
+    rmm::cuda_stream_view stream,
+    BufferResource* br
 ) {
     ChunkBatch chunk;
     size_t metadata_buf_size =
@@ -214,7 +207,11 @@ ChunkBatch ChunkBatch::from_packed_data(
         // Write data size
         *reinterpret_cast<uint64_t*>(chunk.psum_data_begin()) =
             packed_data.gpu_data->size();
-        chunk.data_ = br->move(std::move(packed_data.gpu_data));
+        chunk.data_ = br->move(
+            std::move(packed_data.gpu_data),
+            stream,
+            std::make_shared<Buffer::Event>(stream)
+        );
     }
 
     return chunk;
diff --git a/cpp/tests/test_chunk.cpp b/cpp/tests/test_chunk.cpp
@@ -17,9 +17,11 @@ class ChunkBatchTest : public ::testing::Test {
   protected:
     void SetUp() override {
         br = std::make_unique<BufferResource>(cudf::get_current_device_resource_ref());
+        stream = cudf::get_default_stream();
     }
 
     std::unique_ptr<BufferResource> br;
+    rmm::cuda_stream_view stream;
 };
 
 TEST_F(ChunkBatchTest, FromFinishedPartition) {
@@ -44,110 +46,52 @@ TEST_F(ChunkBatchTest, FromFinishedPartition) {
     auto chunk2 = ChunkBatch::from_metadata_message(chunk.release_metadata_buffer());
     test_chunk(chunk2);
 
-    auto chunk3 = chunk2.get_data(chunk_id, 0, cudf::get_default_stream());
+    auto chunk3 = chunk2.get_data(chunk_id, 0, stream);
     test_chunk(chunk3);
+
+    EXPECT_THROW(chunk3.get_data(chunk_id, 1, stream), std::out_of_range);
 }
 
-// TEST_F(ChunkBatchTest, FromPackedData) {
-//     ChunkID chunk_id = 123;
-//     PartID part_id = 456;
-
-//     // Create test metadata
-//     auto metadata = std::make_unique<std::vector<uint8_t>>(4);
-//     metadata->at(0) = 1;
-//     metadata->at(1) = 2;
-//     metadata->at(2) = 3;
-//     metadata->at(3) = 4;
-
-//     // Create test GPU data
-//     auto gpu_data = br->allocate(MemoryType::DEVICE, 4);
-//     uint8_t host_data[4] = {5, 6, 7, 8};
-//     CUDA_TRY(cudaMemcpy(gpu_data->data, host_data, 4, cudaMemcpyHostToDevice));
-
-//     PackedData packed_data{std::move(metadata), std::move(gpu_data)};
-//     auto chunk =
-//         ChunkBatch::from_packed_data(chunk_id, part_id, std::move(packed_data),
-//         br.get());
-
-//     EXPECT_EQ(chunk.chunk_id(), chunk_id);
-//     EXPECT_EQ(chunk.n_messages(), 1);
-//     EXPECT_EQ(chunk.part_id(0), part_id);
-//     EXPECT_EQ(chunk.expected_num_chunks(0), 0);
-//     EXPECT_FALSE(chunk.is_control_message(0));
-//     EXPECT_EQ(chunk.metadata_size(0), 4);
-//     EXPECT_EQ(chunk.data_size(0), 4);
-// }
-
-// TEST_F(ChunkBatchTest, ValidateMetadataFormat) {
-//     // Test valid metadata format
-//     auto valid_chunk = ChunkBatch::from_finished_partition(123, 456, 789);
-//     EXPECT_TRUE(ChunkBatch::validate_metadata_format(*valid_chunk.release_metadata_buffer(
-//     )));
-
-//     // Test invalid metadata format (too small)
-//     std::vector<uint8_t> too_small(4);
-//     EXPECT_FALSE(ChunkBatch::validate_metadata_format(too_small));
-
-//     // Test invalid metadata format (zero messages)
-//     std::vector<uint8_t> zero_messages(16);
-//     *reinterpret_cast<ChunkID*>(zero_messages.data()) = 123;
-//     *reinterpret_cast<size_t*>(zero_messages.data() + sizeof(ChunkID)) = 0;
-//     EXPECT_FALSE(ChunkBatch::validate_metadata_format(zero_messages));
-// }
-
-// TEST_F(ChunkBatchTest, GetData) {
-//     ChunkID chunk_id = 123;
-//     PartID part_id = 456;
-
-//     // Create test metadata
-//     auto metadata = std::make_unique<std::vector<uint8_t>>(4);
-//     metadata->at(0) = 1;
-//     metadata->at(1) = 2;
-//     metadata->at(2) = 3;
-//     metadata->at(3) = 4;
-
-//     // Create test GPU data
-//     auto gpu_data = br->allocate(MemoryType::DEVICE, 4);
-//     uint8_t host_data[4] = {5, 6, 7, 8};
-//     CUDA_TRY(cudaMemcpy(gpu_data->data, host_data, 4, cudaMemcpyHostToDevice));
-
-//     PackedData packed_data{std::move(metadata), std::move(gpu_data)};
-//     auto chunk =
-//         ChunkBatch::from_packed_data(chunk_id, part_id, std::move(packed_data),
-//         br.get());
-
-//     // Test getting data from a data message
-//     auto new_chunk = chunk.get_data(789, 0, cudf::get_default_stream());
-//     EXPECT_EQ(new_chunk.chunk_id(), 789);
-//     EXPECT_EQ(new_chunk.n_messages(), 1);
-//     EXPECT_EQ(new_chunk.part_id(0), part_id);
-//     EXPECT_EQ(new_chunk.metadata_size(0), 4);
-//     EXPECT_EQ(new_chunk.data_size(0), 4);
-
-//     // Test getting data from a control message
-//     auto control_chunk = ChunkBatch::from_finished_partition(123, 456, 789);
-//     auto new_control_chunk = control_chunk.get_data(999, 0,
-//     cudf::get_default_stream()); EXPECT_EQ(new_control_chunk.chunk_id(), 999);
-//     EXPECT_EQ(new_control_chunk.n_messages(), 1);
-//     EXPECT_EQ(new_control_chunk.part_id(0), 456);
-//     EXPECT_EQ(new_control_chunk.expected_num_chunks(0), 789);
-//     EXPECT_TRUE(new_control_chunk.is_control_message(0));
-// }
-
-// TEST_F(ChunkBatchTest, FromMetadataMessage) {
-//     // Create a chunk and convert it to metadata message
-//     auto original_chunk = ChunkBatch::from_finished_partition(123, 456, 789);
-//     auto metadata_msg = original_chunk.release_metadata_buffer();
-
-//     // Create new chunk from metadata message
-//     auto new_chunk = ChunkBatch::from_metadata_message(std::move(metadata_msg));
-
-//     EXPECT_EQ(new_chunk.chunk_id(), 123);
-//     EXPECT_EQ(new_chunk.n_messages(), 1);
-//     EXPECT_EQ(new_chunk.part_id(0), 456);
-//     EXPECT_EQ(new_chunk.expected_num_chunks(0), 789);
-//     EXPECT_TRUE(new_chunk.is_control_message(0));
-// }
+TEST_F(ChunkBatchTest, FromPackedData) {  // one data message: build it, rebuild it from its parts, then get_data
+    ChunkID chunk_id = 123;
+    PartID part_id = 456;
+
+    // Host-side metadata payload: the four bytes {1, 2, 3, 4}
+    auto metadata =
+        std::make_unique<std::vector<uint8_t>>(std::vector<uint8_t>{1, 2, 3, 4});
+
+    // Device payload: a 4-byte rmm::device_buffer filled from host_data via cudaMemcpy
+    auto data = std::make_unique<rmm::device_buffer>(4, cudf::get_default_stream());
+    std::vector<uint8_t> host_data{5, 6, 7, 8};
+    RAPIDSMPF_CUDA_TRY(
+        cudaMemcpy(data->data(), host_data.data(), 4, cudaMemcpyHostToDevice)
+    );
+
+    PackedData packed_data{  // receives a copy of *metadata; the device buffer is moved in
+        std::make_unique<std::vector<uint8_t>>(*metadata), std::move(data)
+    };
+
+    auto test_chunk = [&](ChunkBatch& chunk) {  // shared expectations: one non-control message, 4 metadata bytes, 4 data bytes
+        EXPECT_EQ(chunk.chunk_id(), chunk_id);
+        EXPECT_EQ(chunk.n_messages(), 1);
+        EXPECT_EQ(chunk.part_id(0), part_id);
+        EXPECT_EQ(chunk.expected_num_chunks(0), 0);
+        EXPECT_FALSE(chunk.is_control_message(0));
+        EXPECT_EQ(chunk.metadata_size(0), 4);
+        EXPECT_EQ(chunk.data_size(0), 4);
+    };
+    auto chunk = ChunkBatch::from_packed_data(
+        chunk_id, part_id, std::move(packed_data), stream, br.get()
+    );
+    test_chunk(chunk);
+
+    auto chunk2 = ChunkBatch::from_metadata_message(chunk.release_metadata_buffer());  // rebuild from the released metadata buffer
+    chunk2.set_data_buffer(chunk.release_data_buffer());  // then attach the data buffer released from `chunk`
+    test_chunk(chunk2);
+
+    auto chunk3 = chunk2.get_data(chunk_id, 0, stream);  // message 0 of a single-message chunk, same chunk id
+    test_chunk(chunk3);
+}
 
 }  // namespace test
 }  // namespace rapidsmpf::shuffler::detail