
Commit 6d1f5de

aadereiko authored

[OPIK-3515] [FE]: fix playground streaming with responses of unfinished lines; (#4488)

* [OPIK-3515]: fix playground streaming with responses of unfinished lines;
* fix eslint issues;

Co-authored-by: aadereiko <[email protected]>
1 parent ff9b730 commit 6d1f5de

2 files changed: +265 -1 lines changed
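In short, the commit adds a pure helper, processSSEChunk, to useCompletionProxyStreaming.ts: any trailing partial line left over from one network chunk is kept in a buffer and prepended to the next chunk, so SSE data lines that get split mid-JSON are reassembled instead of being parsed as fragments. Below is a minimal sketch (not part of the commit) of how the helper behaves, mirroring the new tests; the import path assumes a file sitting alongside useCompletionProxyStreaming.ts.

import { processSSEChunk } from "./useCompletionProxyStreaming";

// One SSE data line is split by the network across two chunks.
const first = processSSEChunk(
  'data: {"choices":[{"delta":{"content":"hello"}}]}\ndata: {"choi',
  "", // no leftover from a previous chunk yet
);
// first.lines     -> ['data: {"choices":[{"delta":{"content":"hello"}}]}']
// first.newBuffer -> 'data: {"choi'  (incomplete, held back)

const second = processSSEChunk(
  'ces":[{"delta":{"content":","}}]}\n',
  first.newBuffer, // the buffered fragment is prepended before splitting
);
// second.lines     -> ['data: {"choices":[{"delta":{"content":","}}]}']
// second.newBuffer -> ""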
Lines changed: 236 additions & 0 deletions
@@ -0,0 +1,236 @@
import { describe, expect, it } from "vitest";
import { processSSEChunk } from "./useCompletionProxyStreaming";

describe("processSSEChunk", () => {
  describe("basic line processing", () => {
    it("should process a single complete line", () => {
      const result = processSSEChunk(
        'data: {"choices":[{"delta":{"content":"hello"}}]}\n',
        "",
      );
      expect(result.lines).toEqual([
        'data: {"choices":[{"delta":{"content":"hello"}}]}',
      ]);
      expect(result.newBuffer).toBe("");
    });

    it("should process multiple complete lines", () => {
      const result = processSSEChunk(
        'data: {"choices":[{"delta":{"content":"hello"}}]}\ndata: {"choices":[{"delta":{"content":" world"}}]}\n',
        "",
      );
      expect(result.lines).toEqual([
        'data: {"choices":[{"delta":{"content":"hello"}}]}',
        'data: {"choices":[{"delta":{"content":" world"}}]}',
      ]);
      expect(result.newBuffer).toBe("");
    });

    it("should skip empty lines", () => {
      const result = processSSEChunk(
        'data: {"content":"a"}\n\n\ndata: {"content":"b"}\n',
        "",
      );
      expect(result.lines).toEqual([
        'data: {"content":"a"}',
        'data: {"content":"b"}',
      ]);
      expect(result.newBuffer).toBe("");
    });
  });

  describe("buffering incomplete lines", () => {
    it("should buffer an incomplete line (no trailing newline)", () => {
      const result = processSSEChunk(
        'data: {"choices":[{"delta":{"content":"hello"}}]}\ndata: {"choi',
        "",
      );
      expect(result.lines).toEqual([
        'data: {"choices":[{"delta":{"content":"hello"}}]}',
      ]);
      expect(result.newBuffer).toBe('data: {"choi');
    });

    it("should prepend buffer to next chunk and complete the line", () => {
      // First chunk ends with incomplete line
      const result1 = processSSEChunk(
        'data: {"choices":[{"delta":{"content":"hello"}}]}\ndata: {"choi',
        "",
      );
      expect(result1.newBuffer).toBe('data: {"choi');

      // Second chunk completes the line
      const result2 = processSSEChunk(
        'ces":[{"delta":{"content":","}}]}\n',
        result1.newBuffer,
      );
      expect(result2.lines).toEqual([
        'data: {"choices":[{"delta":{"content":","}}]}',
      ]);
      expect(result2.newBuffer).toBe("");
    });

    it("should handle line split across multiple chunks", () => {
      // Simulate a JSON line split across 3 chunks
      const result1 = processSSEChunk('data: {"choices":[{"del', "");
      expect(result1.lines).toEqual([]);
      expect(result1.newBuffer).toBe('data: {"choices":[{"del');

      const result2 = processSSEChunk(
        'ta":{"content":"test',
        result1.newBuffer,
      );
      expect(result2.lines).toEqual([]);
      expect(result2.newBuffer).toBe(
        'data: {"choices":[{"delta":{"content":"test',
      );

      const result3 = processSSEChunk('"}}]}\n', result2.newBuffer);
      expect(result3.lines).toEqual([
        'data: {"choices":[{"delta":{"content":"test"}}]}',
      ]);
      expect(result3.newBuffer).toBe("");
    });
  });

  describe("edge cases", () => {
    it("should handle empty chunk with buffer", () => {
      const result = processSSEChunk("", 'data: {"partial":');
      expect(result.lines).toEqual([]);
      expect(result.newBuffer).toBe('data: {"partial":');
    });

    it("should handle chunk that is only newlines", () => {
      const result = processSSEChunk("\n\n\n", "");
      expect(result.lines).toEqual([]);
      expect(result.newBuffer).toBe("");
    });

    it("should handle buffer that becomes complete with newline chunk", () => {
      const result = processSSEChunk(
        "\n",
        'data: {"choices":[{"delta":{"content":"x"}}]}',
      );
      expect(result.lines).toEqual([
        'data: {"choices":[{"delta":{"content":"x"}}]}',
      ]);
      expect(result.newBuffer).toBe("");
    });

    it("should handle whitespace-only lines (should be filtered)", () => {
      const result = processSSEChunk(" \n\t\n", "");
      expect(result.lines).toEqual([]);
      expect(result.newBuffer).toBe("");
    });

    it("should handle chunk ending exactly at newline", () => {
      const result = processSSEChunk('data: {"content":"a"}\n', "");
      expect(result.lines).toEqual(['data: {"content":"a"}']);
      expect(result.newBuffer).toBe("");
    });
  });

  describe("real-world scenarios", () => {
    it("should preserve content when SSE message is split mid-JSON", () => {
      const chunk1 =
        'data: {"choices":[{"delta":{"content":"hello"}}]}\ndata: {"choi';
      const chunk2 = 'ces":[{"delta":{"content":","}}]}\n';

      const result1 = processSSEChunk(chunk1, "");
      expect(result1.lines).toEqual([
        'data: {"choices":[{"delta":{"content":"hello"}}]}',
      ]);
      expect(result1.newBuffer).toBe('data: {"choi');

      const result2 = processSSEChunk(chunk2, result1.newBuffer);
      expect(result2.lines).toEqual([
        'data: {"choices":[{"delta":{"content":","}}]}',
      ]);
      expect(result2.newBuffer).toBe("");
    });

    it("should handle streaming with usage info at the end", () => {
      const chunks = [
        'data: {"choices":[{"delta":{"content":"Hi"}}]}\ndata: {"choi',
        'ces":[{"delta":{"content":"!"}}]}\n',
        'data: {"choices":[],"usage":{"prompt_tokens":10,"completion_tokens":2}}\n',
      ];

      let buffer = "";
      const allLines: string[] = [];

      for (const chunk of chunks) {
        const result = processSSEChunk(chunk, buffer);
        allLines.push(...result.lines);
        buffer = result.newBuffer;
      }

      expect(allLines).toEqual([
        'data: {"choices":[{"delta":{"content":"Hi"}}]}',
        'data: {"choices":[{"delta":{"content":"!"}}]}',
        'data: {"choices":[],"usage":{"prompt_tokens":10,"completion_tokens":2}}',
      ]);
      expect(buffer).toBe("");
    });

    it("should handle [DONE] signal", () => {
      const result = processSSEChunk("data: [DONE]\n", "");
      expect(result.lines).toEqual(["data: [DONE]"]);
      expect(result.newBuffer).toBe("");
    });

    it("should preserve comma in JSON schema output - qwen model scenario", () => {
      const chunks = [
        'data: {"choices":[{"delta":{"content":"[\\"wedding surprise reactions|0.86\\""}}]}\n',
        'data: {"choices":[{"delta":{"content":","}}]}\ndata: {"ch',
        'oices":[{"delta":{"content":" \\"beach sunset|0.92\\"]"}}]}\n',
      ];

      let buffer = "";
      const allLines: string[] = [];

      for (const chunk of chunks) {
        const result = processSSEChunk(chunk, buffer);
        allLines.push(...result.lines);
        buffer = result.newBuffer;
      }

      expect(allLines).toHaveLength(3);
      expect(allLines[0]).toContain("wedding surprise reactions|0.86");
      expect(allLines[1]).toContain(",");
      expect(allLines[2]).toContain("beach sunset|0.92");
      expect(buffer).toBe("");
    });

    it("should handle JSON with pipe-separated values split across many chunks", () => {
      const chunks = [
        'data: {"choices":[{"delta":{"content":"wedding surprise reactions|0.86"}}]}\n',
        'data: {"choices":[{"delta":{"content":","}}]}\ndata: {"choices":[{"del',
        'ta":{"content":" beach|0.75"}}]}\n',
      ];

      let buffer = "";
      const allLines: string[] = [];

      for (const chunk of chunks) {
        const result = processSSEChunk(chunk, buffer);
        allLines.push(...result.lines);
        buffer = result.newBuffer;
      }

      expect(allLines).toHaveLength(3);
      expect(allLines[0]).toContain("wedding surprise reactions|0.86");
      expect(allLines[1]).toContain(",");
      expect(allLines[2]).toContain("beach|0.75");
      expect(buffer).toBe("");

      const contentParts = allLines.map((line) => {
        const match = line.match(/"content":"([^"]*)"/);
        return match ? match[1] : "";
      });
      const fullContent = contentParts.join("");

      expect(fullContent).toBe("wedding surprise reactions|0.86, beach|0.75");
    });
  });
});

apps/opik-frontend/src/api/playground/useCompletionProxyStreaming.ts

Lines changed: 29 additions & 1 deletion
@@ -18,6 +18,30 @@ import { ProviderMessageType } from "@/types/llm";
 
 const DATA_PREFIX = "data:";
 
+/**
+ * Processes SSE chunk data with buffering for incomplete lines.
+ * SSE messages can be split across network chunks, so we buffer incomplete
+ * lines and only process complete lines (those ending with newline).
+ */
+export const processSSEChunk = (
+  chunk: string,
+  buffer: string,
+): { lines: string[]; newBuffer: string } => {
+  const data = buffer + chunk;
+  const lines = data.split("\n");
+
+  // if the data doesn't end with newline, the last element is incomplete
+  // save it for the next iteration
+  let newBuffer = "";
+  if (!data.endsWith("\n")) {
+    newBuffer = lines.pop() || "";
+  }
+
+  const completeLines = lines.filter((line) => line.trim() !== "");
+
+  return { lines: completeLines, newBuffer };
+};
+
 const getNowUtcTimeISOString = (): string => {
   return dayjs().utc().toISOString();
 };

@@ -192,6 +216,9 @@ const useCompletionProxyStreaming = ({
      }
    };
 
+    // buffer to hold incomplete lines across chunks
+    let lineBuffer = "";
+
    // an analogue of true && reader
    // we need it to wait till the stream is closed
    while (reader) {

@@ -202,7 +229,8 @@
      }
 
      const chunk = decoder.decode(value, { stream: true });
-      const lines = chunk.split("\n").filter((line) => line.trim() !== "");
+      const { lines, newBuffer } = processSSEChunk(chunk, lineBuffer);
+      lineBuffer = newBuffer;
 
      for (const line of lines) {
        const JSONData = line.startsWith(DATA_PREFIX)
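For contrast, here is a brief sketch (not from the commit) of what the removed line did with the same kind of input: splitting each chunk in isolation turns a data line cut by the network into two fragments, and neither fragment is a complete "data:" line, which is how streamed content such as a lone "," delta could go missing before this fix (the scenario the "qwen model" test above covers). The variable names are illustrative only.

// Old per-chunk splitting, as in the removed line above (illustrative input).
const tail = 'data: {"choi'; // end of one network chunk
const head = 'ces":[{"delta":{"content":","}}]}\n'; // start of the next chunk

const oldLines = [
  ...tail.split("\n").filter((line) => line.trim() !== ""),
  ...head.split("\n").filter((line) => line.trim() !== ""),
];
// oldLines is ['data: {"choi', 'ces":[{"delta":{"content":","}}]}'] — the JSON
// payload is spread across two entries, so neither parses and the "," is lost.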

0 commit comments
