test_lora_llama3_8b_async_with_custom_code - increase output length (deepjavalibrary#2990)

smouaa · web-flow · commit c3006110256d · 2026-01-25T19:36:06.000-08:00
diff --git a/tests/integration/llm/client.py b/tests/integration/llm/client.py
@@ -201,7 +201,7 @@ def get_model_name():
     "llama3-8b-unmerged-lora-with-custom-code": {
         "option.model_id": "s3://djl-llm/llama-3-8b-instruct-hf/",
         "batch_size": [4],
-        "seq_length": [16, 32],
+        "seq_length": [32, 64],
         "worker": 1,
         "adapters": ["medical", "exam"],
         "tokenizer": "unsloth/llama-3-8b-Instruct",
@@ -821,6 +821,9 @@ def extract_chat_content(response_content):
         line = line.strip()
         if not line:
             continue
+
+        if line.startswith("data: "):
+            line = line[6:]  # Remove "data: " prefix
         try:
             parsed = json.loads(line)
             # Non-streaming chat completion format
@@ -1576,6 +1579,16 @@ def response_checker(res, message):
             for item in message.split('\n'):
                 item = item.strip()
                 if len(item) > 0:
+                    if item.startswith('data: '):
+                        item = item[6:]  # Remove "data: " prefix
+
+                    # Skip [DONE] markers
+                    if item == '[DONE]':
+                        continue
+
+                    # Skip empty items after stripping
+                    if not item:
+                        continue
                     try:
                         json_lines.append(json.loads(item))
                     except json.JSONDecodeError as e:
@@ -1714,6 +1727,18 @@ def check_output_formatter_applied(response_text, expected_identifier):
         line = line.strip()
         if not line:
             continue
+
+        if line.startswith('data: '):
+            line = line[6:]  # Remove "data: " prefix
+
+        # Skip [DONE] markers
+        if line == '[DONE]':
+            continue
+
+        # Skip empty lines after stripping
+        if not line:
+            continue
+
         try:
             parsed_json = json.loads(line)
             # Check for text completion format