
Commit ab0a98a

Author raminmohammadi committed:

added query agent which responds with respect to the available KB
1 parent f35d091 commit ab0a98a

File tree

10 files changed: +286 −43 lines

clean_env.sh

Lines changed: 18 additions & 0 deletions
@@ -0,0 +1,18 @@
#!/bin/bash

echo "🧹 Cleaning environment..."

# Remove virtual environment
rm -rf .venv
rm -rf build/
rm -rf dist/

# Remove Python cache
find . -name '*.pyc' -delete
find . -type d -name '__pycache__' -exec rm -rf {} +
pip cache purge

# Remove test and mypy caches
rm -rf __pycache__ .pytest_cache .mypy_cache

echo "✅ Clean complete."

frontend/package-lock.json

Lines changed: 34 additions & 1 deletion
Some generated files are not rendered by default.

frontend/package.json

Lines changed: 3 additions & 1 deletion
@@ -13,12 +13,14 @@
     "clsx": "^2.0.0",
     "lucide-react": "^0.293.0",
     "next": "^14.2.28",
+    "next-themes": "^0.4.6",
     "postcss": "^8.4.24",
     "radix-ui": "^1.0.0",
     "react": "18.2.0",
     "react-dom": "18.2.0",
     "shadcn-ui": "^0.9.0",
-    "tailwindcss": "^3.4.1"
+    "tailwindcss": "^3.4.1",
+    "tailwindcss-animate": "^1.0.7"
   },
   "devDependencies": {
     "@types/node": "22.14.0",
langchain_ai_agent/agents/chat_agent.py

Lines changed: 130 additions & 0 deletions
@@ -0,0 +1,130 @@
from langchain.chains import (
    create_history_aware_retriever,
)
from langchain.chains.combine_documents import create_stuff_documents_chain
from langchain_core.prompts import ChatPromptTemplate, MessagesPlaceholder
from langchain_google_vertexai import ChatVertexAI
from langchain_ai_agent.retriever.vector_store import DocumentEmbedder
from langchain_core.runnables import RunnableLambda, RunnableMap

# LangGraph memory imports
from langgraph.checkpoint.memory import MemorySaver
from langchain.prompts import PromptTemplate
from langgraph.graph import START, END, StateGraph
from langchain_core.messages import AIMessage, HumanMessage
from typing import TypedDict, Annotated, Sequence
import operator
import logging

# Configure logging
logger = logging.getLogger(__name__)
logging.basicConfig(level=logging.INFO)


class AgentState(TypedDict):
    messages: Annotated[Sequence[HumanMessage | AIMessage], operator.add]
    question: str
    graph_output: str


def get_chat_agent_with_memory(persist_dir: str):
    """
    Creates and returns an agent that maintains persistent conversation memory.
    The agent is invoked using .ainvoke({"question": ...}, config={"configurable": {"thread_id": ...}})
    """
    embedder = DocumentEmbedder(persist_dir=persist_dir)
    retriever = embedder.get_retriever(k=10)

    llm = ChatVertexAI(
        model_name="gemini-2.0-flash-lite",
        temperature=0.3,
        max_output_tokens=1024,
    )

    contextualize_q_system_prompt = (
        "Given a chat history and the latest user question "
        "which might reference context in the chat history, "
        "formulate a standalone question that can be understood "
        "without the chat history. Do NOT answer the question; just "
        "reformulate it if needed and otherwise return it as is."
    )
    contextualize_q_prompt = ChatPromptTemplate.from_messages(
        [
            ("system", contextualize_q_system_prompt),
            MessagesPlaceholder(variable_name="chat_history"),
            ("human", "{input}"),
        ]
    )

    try:
        history_aware_retriever = create_history_aware_retriever(
            llm, retriever, contextualize_q_prompt
        )
    except Exception as e:
        logger.info(f"[Retriever] {e}")

    qa_system_prompt = (
        "You are an assistant for question-answering tasks. Use the following "
        "pieces of retrieved context to answer the question. If you don't know "
        "the answer, just say that you don't know. Use three sentences maximum and "
        "keep the answer concise."
    )

    stuff_prompt = PromptTemplate(
        template="""You are an assistant for question-answering tasks.
Use the following pieces of context to answer the question. If you don't know the answer, just say that you don't know.
Context:
{context}
Question:
{question}
Answer:""",
        input_variables=["context", "question"]
    )

    try:
        combine_docs_chain = create_stuff_documents_chain(llm, stuff_prompt)
    except Exception as e:
        logger.info(f"[Chain] {e}")

    retrieval_chain = RunnableMap({
        "context": lambda x: retriever.invoke(x["input"]),
        "question": lambda x: x["input"]
    }) | combine_docs_chain

    graph_builder = StateGraph(AgentState)

    def call_model(state: AgentState) -> dict:
        logger.info(f"[call_model] Full state: {state}")
        question = state.get("question", "")
        logger.info(f"[call_model] Extracted question: {question}")

        if not question:
            return {
                "messages": [AIMessage(content="[call_model] Empty or missing question.")],
                "graph_output": "[call_model] Empty or missing question."
            }

        chat_history = state.get("messages", [])

        chain_input = {
            "input": question,
            "chat_history": chat_history
        }

        chain_output = retrieval_chain.invoke(chain_input)
        answer_text = chain_output

        logger.info(f"[Agent] Response: {answer_text}")

        return {
            "messages": [AIMessage(content=answer_text or "[call_model] No answer generated.")],
            "graph_output": answer_text or "[call_model] No answer generated."
        }

    graph_builder.add_node("model", call_model)
    graph_builder.set_entry_point("model")
    graph_builder.add_edge("model", END)

    memory = MemorySaver()
    app = graph_builder.compile(checkpointer=memory)
    return app
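
Note that qa_system_prompt and history_aware_retriever are built here but never wired into retrieval_chain, which calls the base retriever directly, so chat history accumulates in the checkpointed state without influencing retrieval. For reference, a minimal sketch of driving the compiled graph the way the docstring describes; the persist_dir path, question, and thread_id below are illustrative assumptions, not values from this commit:

import asyncio

from langchain_ai_agent.agents.chat_agent import get_chat_agent_with_memory

async def main():
    # Illustrative path: any FAISS index directory produced by DocumentEmbedder works.
    agent = get_chat_agent_with_memory(persist_dir="faiss_index/default")

    # The thread_id keys the MemorySaver checkpoint, so reusing it
    # continues the same conversation across calls.
    result = await agent.ainvoke(
        {"question": "What does the knowledge base cover?"},
        config={"configurable": {"thread_id": "demo-session"}},
    )
    print(result["graph_output"])

asyncio.run(main())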
Lines changed: 23 additions & 5 deletions
@@ -1,13 +1,31 @@
 from fastapi import APIRouter, Query, HTTPException
-from langchain_ai_agent.retriever.vector_store import DocumentEmbedder
+from fastapi.responses import StreamingResponse
+from langchain_ai_agent.agents.chat_agent import get_chat_agent_with_memory
+import traceback, logging
+from fastapi.responses import JSONResponse
+
+logger = logging.getLogger(__name__)
+logging.basicConfig(level=logging.INFO)
 
 router = APIRouter()
 
 @router.get("/api/query")
-def query_kb(question: str = Query(...), namespace: str = Query("default")):
+async def query_kb(question: str = Query(...), namespace: str = Query("default")):
     try:
-        embedder = DocumentEmbedder(persist_dir=f"faiss_index/{namespace}")
-        docs = embedder.query(question)
-        return {"results": [doc.page_content for doc in docs]}
+        agent = get_chat_agent_with_memory(persist_dir=f"faiss_index/{namespace}")
+        result = await agent.ainvoke(
+            {"question": question},
+            config={"configurable": {"thread_id": "query-session"}}
+        )
+
+        answer = result.get("graph_output", "").strip()
+        if not answer:
+            raise HTTPException(status_code=500, detail="Agent returned no answer.")
+
+        # ✅ Send response as JSON with a results array
+        return JSONResponse(content={"results": [answer]})
+
     except Exception as e:
+        logger.error(f"Agent execution failed: {e}")
+        logger.error(traceback.format_exc())
         raise HTTPException(status_code=500, detail=str(e))
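
A quick way to exercise the updated endpoint once the FastAPI app serving this router is running; the host, port, and question below are assumptions for illustration:

import requests

# Assumes the app is reachable locally; adjust host/port to your deployment.
resp = requests.get(
    "http://localhost:8000/api/query",
    params={"question": "What file types can be ingested?", "namespace": "default"},
)
resp.raise_for_status()
print(resp.json()["results"][0])

Note that the route builds a fresh agent, and with it a fresh MemorySaver, on every request, so the fixed "query-session" thread_id does not yet carry conversation memory across HTTP calls.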

langchain_ai_agent/config/ingestion_config.yml

Lines changed: 2 additions & 1 deletion
@@ -4,4 +4,5 @@ supported_extensions:
   - .pdf
   - .docx
   - .txt
-  - .eml
+  - .eml
+  - .html

langchain_ai_agent/ingestion/reader.py

Lines changed: 1 addition & 1 deletion
@@ -16,7 +16,7 @@ def __init__(self, config_path: str = "config/ingestion_config.yaml"):
         self.config = self._load_config(config_path)
         self.chunk_size = self.config.get("chunk_size", 500)
         self.chunk_overlap = self.config.get("chunk_overlap", 50)
-        self.supported_extensions = set(self.config.get("supported_extensions", [".pdf", ".docx", ".txt", ".eml"]))
+        self.supported_extensions = set(self.config.get("supported_extensions", [".pdf", ".docx", ".txt", ".eml", ".html"]))
         self.text_splitter = RecursiveCharacterTextSplitter(
             chunk_size=self.chunk_size,
             chunk_overlap=self.chunk_overlap
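
With .html added to both the YAML config and the in-code fallback, HTML files now pass the reader's extension gate. A minimal sketch of how such an allow-list typically filters a directory tree; the iter_supported_files helper is an illustrative assumption, not part of the commit:

from pathlib import Path

def iter_supported_files(root: str, supported_extensions: set[str]):
    # Hypothetical helper for illustration: yield only files whose
    # suffix appears in the configured allow-list.
    for path in Path(root).rglob("*"):
        if path.is_file() and path.suffix.lower() in supported_extensions:
            yield path

# Example: list newly ingestible HTML files alongside the other formats.
for f in iter_supported_files("docs", {".pdf", ".docx", ".txt", ".eml", ".html"}):
    print(f)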
