Building-RAG-System-with-Deepseek-R1-Locally/main.py at main · ajitsingh98/Building-RAG-System-with-Deepseek-R1-Locally · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
# Imports

from langchain_core.globals import set_verbose, set_debug
from langchain_ollama import ChatOllama, OllamaEmbeddings
from langchain.schema.output_parser import StrOutputParser
from langchain_community.vectorstores import Chroma
from langchain_community.document_loaders import PyPDFLoader
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain.schema.runnable import RunnablePassthrough
from langchain_community.vectorstores.utils import filter_complex_metadata
from langchain_core.prompts import ChatPromptTemplate
import logging

set_debug(True)
set_verbose(True)

logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

class ChatPDFProcessor:
    """
    Class for processing PDF documents and enabling question-answering using an LLM model.
    """

    def __init__(self, llm_model: str = 'deepseek-r1:latest', embedding_model: str = 'mxbai-embed-large'):
        """
        Initializes the ChatPDFProcessor with the provided LLM and embedding models.

        Args:
        - llm_model (str): LLM model for question answering.
        - embedding_model (str): Embedding model for document processing.
        """
        self.llm_model = ChatOllama(model=llm_model)
        self.embedding_model = OllamaEmbeddings(model=embedding_model)
        self.text_splitter = RecursiveCharacterTextSplitter(chunk_size=1024, chunk_overlap=100)
        self.prompt_template = ChatPromptTemplate.from_template(
            """
            You are a helpful assistant answering questions based on the uploaded document.
            Context:
            {context}

            Question:
            {question}

            Answer concisely and accurately in three sentences or less.
            """
        )
        self.vector_store = None
        self.retriever = None

    def ingest_pdf(self, pdf_file_path: str):
        """
        Ingests a PDF document, processes it into embeddings, and stores it in a vector store.

        Args:
        - pdf_file_path (str): Path to the PDF document to ingest.
        """
        logger.info(f"Starting ingestion for file: {pdf_file_path}")
        documents = PyPDFLoader(file_path=pdf_file_path).load()
        chunks = self.text_splitter.split_documents(documents)
        chunks = filter_complex_metadata(chunks)

        self.vector_store = Chroma.from_documents(
            documents=chunks,
            embedding=self.embedding_model,
            persist_directory="chroma_db",
        )
        logger.info("Ingestion completed. Document embeddings stored successfully.")

    def query_document(self, query: str, k: int = 5, score_threshold: float = 0.2):
        """
        Queries the ingested document and retrieves relevant context using the vector store.

        Args:
        - query (str): The question to ask.
        - k (int): The number of relevant documents to retrieve (default is 5).
        - score_threshold (float): The minimum similarity score to consider for retrieved documents (default is 0.2).

        Returns:
        - str: The LLM-generated answer or a message if no relevant context is found.
        """
        if not self.vector_store:
            raise ValueError("No vector store found. Please ingest a document first.")

        if not self.retriever:
            self.retriever = self.vector_store.as_retriever(
                search_type='similarity_score_threshold',
                search_kwargs={"k": k, "score_threshold": score_threshold},
            )

        logger.info(f"Retrieving context for query: {query}")
        retrieved_docs = self.retriever.invoke(query)
        if not retrieved_docs:
            return "No relevant context found in the document to answer your question."

        formatted_input = {
            "context": "\n\n".join(doc.page_content for doc in retrieved_docs),
            "question": query,
        }

        chain = (
            RunnablePassthrough()
            | self.prompt_template
            | self.llm_model
            | StrOutputParser()
        )
        logger.info("Generating response using the LLM.")
        return chain.invoke(formatted_input)

    def clear_data(self):
        """
        Clears the vector store and retriever to reset the system.
        """
        logger.info("Clearing vector store and retriever.")
        self.vector_store = None
        self.retriever = None