@@ -1,6 +1,10 @@
 """FastAPI server for LLMSearch."""
 
 import os
+
+# This is a temporary workaround for an incompatibility between ChromaDB and the latest version of Protobuf
+os.environ["PROTOCOL_BUFFERS_PYTHON_IMPLEMENTATION"] = "python"
+
 from functools import lru_cache
 from typing import Any, List
 
@@ -24,7 +28,7 @@
 
 
 load_dotenv()
-langchain.debug = True  # Enable debug mode for langchain  # type: ignore
+langchain.debug = False
 
 
 # Load the configuration
@@ -101,7 +105,7 @@ def get_llm_bundle_cached() -> LLMBundle: |
     description="pyLLMSearch MCP Server",
     describe_all_responses=True,  # Include all possible response schemas
     describe_full_response_schema=True,  # Include full JSON schema in descriptions
-    include_operations=["rag_retrieve_chunks", "rag_generate_answer"],
+    include_operations=["rag_retrieve_chunks", "rag_generate_answer", "rag_generate_answer_simple"],
 )
 
 
@@ -145,6 +149,26 @@ async def llmsearch( |
     )
     return output.model_dump()
 
+@api_app.get("/rag", operation_id="rag_generate_answer_simple")
+async def llmsearch_simple(
+    question: str,
+    label: str = "",
+    llm_bundle: LLMBundle = Depends(get_llm_bundle_cached),
+) -> str:
+    """Retrieves an answer to the question from the embedded documents using semantic search."""
+    if label and (label not in get_config().embeddings.labels):
+        raise HTTPException(
+            status_code=404,
+            detail=f"Label '{label}' doesn't exist. Use GET /labels to get a list of labels.",
+        )
+
+    output = get_and_parse_response(
+        query=question,
+        llm_bundle=llm_bundle,
+        config=get_config(),
+        label=label,
+    )
+    return output.response
 
 @api_app.get("/semantic/{question}", operation_id="rag_retrieve_chunks")
 async def semanticsearch(question: str):
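
A minimal client sketch for the new GET /rag endpoint added above. The base URL, the example question, and the use of the requests library are assumptions, not part of this change; the actual path may also carry a prefix depending on how api_app is mounted.

import requests

# Query the simple RAG endpoint. "label" is optional; when supplied, it must
# match one of the configured embedding labels (see GET /labels).
resp = requests.get(
    "http://localhost:8000/rag",  # assumed local dev address
    params={"question": "What does pyLLMSearch do?", "label": ""},
    timeout=120,
)
resp.raise_for_status()
# The endpoint returns a plain string, which FastAPI serializes as a JSON string.
print(resp.json())

Unlike rag_generate_answer, which returns the full response object via model_dump(), this endpoint returns only output.response, so clients that just need the answer text avoid parsing the larger schema.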