🐛 Bugfix: skill names and descriptions are never loaded into context (#3207)

Jasonxia007 · web-flow · commit 54bee0f95930 · 2026-06-09T15:56:25.000+08:00
🐛 Bugfix: official skills not copied to target directory
diff --git a/backend/agents/create_agent_info.py b/backend/agents/create_agent_info.py
@@ -433,25 +433,6 @@ async def create_agent_config(
     }
     system_prompt = Template(prompt_template["system_prompt"], undefined=StrictUndefined).render(render_kwargs)
 
-    context_components = build_context_components(
-        duty=duty_prompt,
-        constraint=constraint_prompt,
-        few_shots=few_shots_prompt,
-        app_name=app_name,
-        app_description=app_description,
-        time_str=time_str,
-        user_id=user_id,
-        language=language,
-        is_manager=is_manager,
-        tools=render_kwargs["tools"],
-        skills=skills,
-        managed_agents=render_kwargs["managed_agents"],
-        external_a2a_agents=render_kwargs["external_a2a_agents"],
-        memory_list=memory_list,
-        memory_search_query=last_user_query,
-        knowledge_base_summary=knowledge_base_summary,
-    )
-
     model_id_to_use = override_model_id if override_model_id else agent_info.get("model_id")
     model_max_tokens = 10000
     if model_id_to_use is not None:
@@ -461,8 +442,33 @@ async def create_agent_config(
             model_max_tokens = model_info["max_tokens"]
     else:
         model_name = "main_model"
-    # Use agent-level setting for context management, default to False
+
+    # Use agent-level setting for context management, default to False.
+    # When ContextManager is disabled, do not attach context_components because
+    # downstream runtime may prefer component-based prompt assembly over the
+    # rendered system_prompt, causing the actual model input to diverge from the
+    # template output.
     enable_context_manager = agent_info.get("enable_context_manager", False)
+    context_components = []
+    if enable_context_manager:
+        context_components = build_context_components(
+            duty=duty_prompt,
+            constraint=constraint_prompt,
+            few_shots=few_shots_prompt,
+            app_name=app_name,
+            app_description=app_description,
+            time_str=time_str,
+            user_id=user_id,
+            language=language,
+            is_manager=is_manager,
+            tools=render_kwargs["tools"],
+            skills=skills,
+            managed_agents=render_kwargs["managed_agents"],
+            external_a2a_agents=render_kwargs["external_a2a_agents"],
+            memory_list=memory_list,
+            memory_search_query=last_user_query,
+            knowledge_base_summary=knowledge_base_summary,
+        )
     cm_config = ContextManagerConfig(
         enabled=enable_context_manager,
         token_threshold=model_max_tokens,
diff --git a/docker/deploy.sh b/docker/deploy.sh
@@ -796,6 +796,15 @@ prepare_directory_and_data() {
   create_dir_with_permission "$NEXENT_USER_DIR" 775
   echo "   🖥️  Nexent user workspace: $NEXENT_USER_DIR"
 
+  # Copy the official-skills-zip folder into the user workspace ($NEXENT_USER_DIR)
+  if [ -d "official-skills-zip" ]; then
+    cp -rn official-skills-zip "$NEXENT_USER_DIR/"
+    chmod -R 775 "$NEXENT_USER_DIR/official-skills-zip"
+    echo "   📦 Official skills copied to $NEXENT_USER_DIR/official-skills-zip"
+  else
+    echo "   ⚠️ official-skills-zip directory not found, skipping skills copy"
+  fi
+
   # Export for docker-compose
   export NEXENT_USER_DIR
 
@@ -1358,7 +1367,7 @@ main_deploy() {
   echo "--------------------------------"
   echo ""
 
-  APP_VERSION="$(get_app_version)"
+  APP_VERSION="latest"
   if [ -z "$APP_VERSION" ]; then
     echo "❌ Failed to get app version, please check the backend/consts/const.py file"
     exit 1
diff --git a/sdk/nexent/core/agents/agent_model.py b/sdk/nexent/core/agents/agent_model.py
@@ -311,12 +311,11 @@ def to_messages(self) -> List[Dict[str, str]]:
             return [{"role": "system", "content": self.formatted_description}]
         return []
 
-    def add_skill(self, name: str, description: str, examples: List[str] = None) -> None:
+    def add_skill(self, name: str, description: str) -> None:
         """Add a skill definition."""
         self.skills.append({
             "name": name,
-            "description": description,
-            "examples": examples or []
+            "description": description
         })
 
 
diff --git a/test/backend/agents/test_create_agent_info.py b/test/backend/agents/test_create_agent_info.py
@@ -3835,6 +3835,52 @@ async def test_join_minio_file_description_to_query_current_files_priority(self)
         pos_history = result.find("history_2.pdf")
         assert pos_current < pos_history, "Current message files should appear before history files"
 
+    def test_format_minio_files_for_content_formats_presigned_urls(self):
+        """History attachment formatting should include both internal and external URLs."""
+        result = _format_minio_files_for_content(
+            [
+                {
+                    "name": "report.pdf",
+                    "object_name": "tenant-a/report.pdf",
+                    "presigned_url": "https://signed.example/report.pdf",
+                }
+            ]
+        )
+
+        assert result.startswith("\n[Attached files]:\n")
+        assert "report.pdf" in result
+        assert "s3://" in result
+        assert "presigned_url: https://signed.example/report.pdf" in result
+
+    def test_convert_history_with_minio_files_embeds_file_info(self):
+        """History items should preserve text and append formatted attachment details."""
+        history = [
+            HistoryItem(
+                role="user",
+                content="Please review this file",
+                minio_files=[
+                    {
+                        "name": "notes.txt",
+                        "object_name": "tenant-a/notes.txt",
+                    }
+                ],
+            ),
+            HistoryItem(role="assistant", content="Done", minio_files=None),
+        ]
+
+        result = _convert_history_with_minio_files(history)
+
+        assert len(result) == 2
+        assert result[0].role == "user"
+        assert result[0].content.startswith("Please review this file")
+        assert "[Attached files]:" in result[0].content
+        assert "notes.txt" in result[0].content
+        assert result[1].content == "Done"
+
+    def test_convert_history_with_minio_files_returns_none_for_none(self):
+        """None history should remain None for downstream SDK compatibility."""
+        assert _convert_history_with_minio_files(None) is None
+
 
 class TestPreparePromptTemplates:
     """Tests for the prepare_prompt_templates function"""
@@ -3865,6 +3911,22 @@ async def test_prepare_prompt_templates_worker_en(self):
             assert result["system_prompt"] == "test system prompt"
             assert result["test"] == "template"
 
+    @pytest.mark.asyncio
+    async def test_prepare_prompt_templates_overwrites_existing_system_prompt(self):
+        """Latest rendered system prompt should replace the template default."""
+        with patch('backend.agents.create_agent_info.get_agent_prompt_template') as mock_get_template:
+            mock_get_template.return_value = {
+                "system_prompt": "stale prompt",
+                "user_prompt": "keep me",
+            }
+
+            result = await prepare_prompt_templates(False, "fresh system prompt", "en")
+
+            assert result == {
+                "system_prompt": "fresh system prompt",
+                "user_prompt": "keep me",
+            }
+
 
 class TestExtractUrlFromCard:
     """Tests for the _extract_url_from_card function"""
diff --git a/test/backend/test_document_vector_integration.py b/test/backend/test_document_vector_integration.py
@@ -1,8 +1,8 @@
 """
-Integration test for document vector operations
+Integration test for document vector operations.
 
-This test demonstrates the complete workflow from ES retrieval to clustering.
-Note: This requires a running Elasticsearch instance.
+This module validates the embedding and clustering workflow using deterministic
+fixtures so the clustering assertions stay stable across environments.
 """
 import os
 import sys
@@ -80,82 +80,84 @@
 
 
 class TestDocumentVectorIntegration:
-    """Integration tests for document vector operations"""
-    
+    """Integration tests for document vector operations."""
+
     def test_complete_workflow(self):
-        """Test complete workflow: embedding calculation -> clustering"""
-        # Simulate document chunks with embeddings
+        """Test complete workflow: embedding calculation -> clustering."""
         chunks_1 = [
-            {'embedding': np.random.rand(128).tolist(), 'content': 'Content for doc 1 chunk 1'},
-            {'embedding': np.random.rand(128).tolist(), 'content': 'Content for doc 1 chunk 2'},
-            {'embedding': np.random.rand(128).tolist(), 'content': 'Content for doc 1 chunk 3'}
+            {"embedding": [1.0, 0.0], "content": "Document one chunk A"},
+            {"embedding": [0.9, 0.1], "content": "Document one chunk B"},
+            {"embedding": [0.95, 0.05], "content": "Document one chunk C"},
         ]
-        
         chunks_2 = [
-            {'embedding': np.random.rand(128).tolist(), 'content': 'Content for doc 2 chunk 1'},
-            {'embedding': np.random.rand(128).tolist(), 'content': 'Content for doc 2 chunk 2'}
+            {"embedding": [0.0, 1.0], "content": "Document two chunk A"},
+            {"embedding": [0.1, 0.9], "content": "Document two chunk B"},
         ]
-        
         chunks_3 = [
-            {'embedding': np.random.rand(128).tolist(), 'content': 'Content for doc 3 chunk 1'},
-            {'embedding': np.random.rand(128).tolist(), 'content': 'Content for doc 3 chunk 2'},
-            {'embedding': np.random.rand(128).tolist(), 'content': 'Content for doc 3 chunk 3'},
-            {'embedding': np.random.rand(128).tolist(), 'content': 'Content for doc 3 chunk 4'}
+            {"embedding": [0.85, 0.15], "content": "Document three chunk A"},
+            {"embedding": [0.8, 0.2], "content": "Document three chunk B"},
+            {"embedding": [0.88, 0.12], "content": "Document three chunk C"},
+            {"embedding": [0.83, 0.17], "content": "Document three chunk D"},
         ]
-        
-        # Calculate document embeddings
+
         doc_embedding_1 = calculate_document_embedding(chunks_1, use_weighted=True)
         doc_embedding_2 = calculate_document_embedding(chunks_2, use_weighted=True)
         doc_embedding_3 = calculate_document_embedding(chunks_3, use_weighted=True)
-        
+
         assert doc_embedding_1 is not None
         assert doc_embedding_2 is not None
         assert doc_embedding_3 is not None
-        
-        # Create document embeddings dictionary
+
         doc_embeddings = {
-            'doc_001': doc_embedding_1,
-            'doc_002': doc_embedding_2,
-            'doc_003': doc_embedding_3
+            "doc_001": doc_embedding_1,
+            "doc_002": doc_embedding_2,
+            "doc_003": doc_embedding_3,
         }
-        
-        # Determine optimal K
+
         embeddings_array = np.array([doc_embedding_1, doc_embedding_2, doc_embedding_3])
         optimal_k = auto_determine_k(embeddings_array, min_k=2, max_k=3)
-        
-        assert 2 <= optimal_k <= 3
-        
-        # Perform clustering
+
+        assert optimal_k == 2
+
         clusters = kmeans_cluster_documents(doc_embeddings, k=optimal_k)
-        
+
         assert len(clusters) == optimal_k
         assert sum(len(docs) for docs in clusters.values()) == 3
-    
+        assert sorted(len(docs) for docs in clusters.values()) == [1, 2]
+
+        cluster_sets = [set(docs) for docs in clusters.values()]
+        assert {"doc_001", "doc_003"} in cluster_sets
+        assert {"doc_002"} in cluster_sets
+
     def test_large_dataset_clustering(self):
-        """Test clustering with larger simulated dataset"""
-        # Create simulated document embeddings
-        n_docs = 50
-        doc_embeddings = {
-            f'doc_{i:03d}': np.random.rand(128) for i in range(n_docs)
+        """Test clustering with a deterministic larger simulated dataset."""
+        cluster_a = {
+            f"doc_a_{i:03d}": np.array([1.0 + i * 0.002, 1.0 + i * 0.001, 0.2])
+            for i in range(20)
+        }
+        cluster_b = {
+            f"doc_b_{i:03d}": np.array([5.0 + i * 0.002, 5.0 + i * 0.001, 0.4])
+            for i in range(15)
+        }
+        cluster_c = {
+            f"doc_c_{i:03d}": np.array([9.0 + i * 0.002, 1.0 + i * 0.001, 0.6])
+            for i in range(15)
         }
-        
-        # Auto-determine K
+        doc_embeddings = {**cluster_a, **cluster_b, **cluster_c}
+        n_docs = len(doc_embeddings)
+
         embeddings_array = np.array(list(doc_embeddings.values()))
-        optimal_k = auto_determine_k(embeddings_array, min_k=3, max_k=15)
-        
-        assert 3 <= optimal_k <= 15
-        
-        # Cluster documents
-        clusters = kmeans_cluster_documents(doc_embeddings, k=optimal_k)
-        
-        assert len(clusters) == optimal_k
+        optimal_k = auto_determine_k(embeddings_array, min_k=3, max_k=6)
+
+        assert 3 <= optimal_k <= 6
+
+        clusters = kmeans_cluster_documents(doc_embeddings, k=3)
+
+        assert len(clusters) == 3
         assert sum(len(docs) for docs in clusters.values()) == n_docs
-        
-        # Verify cluster sizes are reasonable
-        cluster_sizes = [len(docs) for docs in clusters.values()]
-        assert min(cluster_sizes) >= 1
-        # Allow for some imbalance in clustering results (realistic for random data)
-        assert max(cluster_sizes) <= n_docs * 0.7  # No single cluster dominates too much
+
+        cluster_sizes = sorted(len(docs) for docs in clusters.values())
+        assert cluster_sizes == [15, 15, 20]
 
 
 if __name__ == '__main__':
diff --git a/test/sdk/core/agents/test_agent_model.py b/test/sdk/core/agents/test_agent_model.py
@@ -302,7 +302,11 @@ def test_model_config_creation_with_all_fields(self):
             temperature=0.7,
             top_p=0.9,
             ssl_verify=False,
-            model_factory="openai"
+            model_factory="openai",
+            extra_body={"chat_template_kwargs": {"enable_thinking": False}},
+            max_tokens=4096,
+            timeout_seconds=45.5,
+            concurrency_limit=3,
         )
         assert config.cite_name == "gpt-4"
         assert config.api_key == "sk-test-key"
@@ -312,6 +316,10 @@ def test_model_config_creation_with_all_fields(self):
         assert config.top_p == 0.9
         assert config.ssl_verify is False
         assert config.model_factory == "openai"
+        assert config.extra_body == {"chat_template_kwargs": {"enable_thinking": False}}
+        assert config.max_tokens == 4096
+        assert config.timeout_seconds == 45.5
+        assert config.concurrency_limit == 3
 
     def test_model_config_creation_with_minimal_fields(self):
         """Test ModelConfig creation with only required fields."""
@@ -326,6 +334,10 @@ def test_model_config_creation_with_minimal_fields(self):
         assert config.top_p == 0.95
         assert config.ssl_verify is True
         assert config.model_factory is None
+        assert config.extra_body is None
+        assert config.max_tokens is None
+        assert config.timeout_seconds is None
+        assert config.concurrency_limit is None
 
     def test_model_config_defaults(self):
         """Test ModelConfig has correct default values."""
diff --git a/test/sdk/core/agents/test_context_component.py b/test/sdk/core/agents/test_context_component.py
@@ -418,15 +418,18 @@ def test_to_messages_empty(self):
 
     def test_add_skill(self):
         comp = agent_model_module.SkillsComponent()
-        comp.add_skill("python_coding", "Write Python code", ["example1", "example2"])
+        comp.add_skill("python_coding", "Write Python code")
         assert len(comp.skills) == 1
         assert comp.skills[0]["name"] == "python_coding"
-        assert comp.skills[0]["examples"] == ["example1", "example2"]
+        assert comp.skills[0]["description"] == "Write Python code"
 
     def test_add_skill_without_examples(self):
         comp = agent_model_module.SkillsComponent()
         comp.add_skill("skill_name", "skill desc")
-        assert comp.skills[0]["examples"] == []
+        assert comp.skills[0] == {
+            "name": "skill_name",
+            "description": "skill desc",
+        }
 
 
 class TestMemoryComponent: