Digital_Detectives_RAG_System

Running

App Files Files Community

Tesneem commited on 2 days ago

Commit

d1c2df0

•

1 Parent(s): d53e8b2

Create app.py

Browse files

Files changed (1) hide show

app.py +439 -0

app.py ADDED Viewed

	@@ -0,0 +1,439 @@

+#############################################################################################################################
+# Filename   : app.py
+# Description: A Streamlit application to showcase how RAG works.
+# Author     : Georgios Ioannou
+#
+# Copyright © 2024 by Georgios Ioannou
+#############################################################################################################################
+# Import libraries.
+import os
+import streamlit as st
+from dotenv import load_dotenv, find_dotenv
+from huggingface_hub import InferenceClient
+from langchain.prompts import PromptTemplate
+from langchain.schema import Document
+from langchain.schema.runnable import RunnablePassthrough, RunnableLambda
+from langchain_community.embeddings import HuggingFaceInferenceAPIEmbeddings
+from langchain_community.vectorstores import MongoDBAtlasVectorSearch
+from pymongo import MongoClient
+from pymongo.collection import Collection
+from typing import Dict, Any
+#############################################################################################################################
+class RAGQuestionAnswering:
+    def __init__(self):
+        """
+        Parameters
+        ----------
+        None
+        Output
+        ------
+        None
+        Purpose
+        -------
+        Initializes the RAG Question Answering system by setting up configuration
+        and loading environment variables.
+        Assumptions
+        -----------
+        - Expects .env file with MONGO_URI and HF_TOKEN
+        - Requires proper MongoDB setup with vector search index
+        - Needs connection to Hugging Face API
+        Notes
+        -----
+        This is the main class that handles all RAG operations
+        """
+        self.load_environment()
+        self.setup_mongodb()
+        self.setup_embedding_model()
+        self.setup_vector_search()
+        self.setup_rag_chain()
+    def load_environment(self) -> None:
+        """
+        Parameters
+        ----------
+        None
+        Output
+        ------
+        None
+        Purpose
+        -------
+        Loads environment variables from .env file and sets up configuration constants.
+        Assumptions
+        -----------
+        Expects a .env file with MONGO_URI and HF_TOKEN defined
+        Notes
+        -----
+        Will stop the application if required environment variables are missing
+        """
+        load_dotenv(find_dotenv())
+        self.MONGO_URI = os.getenv("MONGO_URI")
+        self.HF_TOKEN = os.getenv("HF_TOKEN")
+        if not self.MONGO_URI or not self.HF_TOKEN:
+            st.error("Please ensure MONGO_URI and HF_TOKEN are set in your .env file")
+            st.stop()
+        # MongoDB configuration.
+        self.DB_NAME = "txts"
+        self.COLLECTION_NAME = "txts_collection"
+        self.VECTOR_SEARCH_INDEX = "vector_index"
+    def setup_mongodb(self) -> None:
+        """
+        Parameters
+        ----------
+        None
+        Output
+        ------
+        None
+        Purpose
+        -------
+        Initializes the MongoDB connection and sets up the collection.
+        Assumptions
+        -----------
+        - Valid MongoDB URI is available
+        - Database and collection exist in MongoDB Atlas
+        Notes
+        -----
+        Uses st.cache_resource for efficient connection management
+        """
+        @st.cache_resource
+        def init_mongodb() -> Collection:
+            cluster = MongoClient(self.MONGO_URI)
+            return cluster[self.DB_NAME][self.COLLECTION_NAME]
+        self.mongodb_collection = init_mongodb()
+    def setup_embedding_model(self) -> None:
+        """
+        Parameters
+        ----------
+        None
+        Output
+        ------
+        None
+        Purpose
+        -------
+        Initializes the embedding model for vector search.
+        Assumptions
+        -----------
+        - Valid Hugging Face API token
+        - Internet connection to access the model
+        Notes
+        -----
+        Uses the all-mpnet-base-v2 model from sentence-transformers
+        """
+        @st.cache_resource
+        def init_embedding_model() -> HuggingFaceInferenceAPIEmbeddings:
+            return HuggingFaceInferenceAPIEmbeddings(
+                api_key=self.HF_TOKEN,
+                model_name="sentence-transformers/all-mpnet-base-v2",
+            )
+        self.embedding_model = init_embedding_model()
+    def setup_vector_search(self) -> None:
+        """
+        Parameters
+        ----------
+        None
+        Output
+        ------
+        None
+        Purpose
+        -------
+        Sets up the vector search functionality using MongoDB Atlas.
+        Assumptions
+        -----------
+        - MongoDB Atlas vector search index is properly configured
+        - Valid embedding model is initialized
+        Notes
+        -----
+        Creates a retriever with similarity search and score threshold
+        """
+        @st.cache_resource
+        def init_vector_search() -> MongoDBAtlasVectorSearch:
+            return MongoDBAtlasVectorSearch.from_connection_string(
+                connection_string=self.MONGO_URI,
+                namespace=f"{self.DB_NAME}.{self.COLLECTION_NAME}",
+                embedding=self.embedding_model,
+                index_name=self.VECTOR_SEARCH_INDEX,
+            )
+        self.vector_search = init_vector_search()
+        self.retriever = self.vector_search.as_retriever(
+            search_type="similarity", search_kwargs={"k": 10, "score_threshold": 0.85}
+        )
+    def format_docs(self, docs: list[Document]) -> str:
+        """
+        Parameters
+        ----------
+        **docs:** list[Document] - List of documents to be formatted
+        Output
+        ------
+        str: Formatted string containing concatenated document content
+        Purpose
+        -------
+        Formats the retrieved documents into a single string for processing
+        Assumptions
+        -----------
+        Documents have page_content attribute
+        Notes
+        -----
+        Joins documents with double newlines for better readability
+        """
+        return "\n\n".join(doc.page_content for doc in docs)
+    def generate_response(self, input_dict: Dict[str, Any]) -> str:
+        """
+        Parameters
+        ----------
+        **input_dict:** Dict[str, Any] - Dictionary containing context and question
+        Output
+        ------
+        str: Generated response from the model
+        Purpose
+        -------
+        Generates a response using the Hugging Face model based on context and question
+        Assumptions
+        -----------
+        - Valid Hugging Face API token
+        - Input dictionary contains 'context' and 'question' keys
+        Notes
+        -----
+        Uses Qwen2.5-1.5B-Instruct model with controlled temperature
+        """
+        hf_client = InferenceClient(api_key=self.HF_TOKEN)
+        formatted_prompt = self.prompt.format(**input_dict)
+        response = hf_client.chat.completions.create(
+            model="Qwen/Qwen2.5-1.5B-Instruct",
+            messages=[
+                {"role": "system", "content": formatted_prompt},
+                {"role": "user", "content": input_dict["question"]},
+            ],
+            max_tokens=1000,
+            temperature=0.2,
+        )
+        return response.choices[0].message.content
+    def setup_rag_chain(self) -> None:
+        """
+        Parameters
+        ----------
+        None
+        Output
+        ------
+        None
+        Purpose
+        -------
+        Sets up the RAG chain for processing questions and generating answers
+        Assumptions
+        -----------
+        Retriever and response generator are properly initialized
+        Notes
+        -----
+        Creates a chain that combines retrieval and response generation
+        """
+        self.prompt = PromptTemplate.from_template(
+            """Use the following pieces of context to answer the question at the end.
+            START OF CONTEXT:
+            {context}
+            END OF CONTEXT:
+            START OF QUESTION:
+            {question}
+            END OF QUESTION:
+            If you do not know the answer, just say that you do not know.
+            NEVER assume things.
+            """
+        )
+        self.rag_chain = {
+            "context": self.retriever | RunnableLambda(self.format_docs),
+            "question": RunnablePassthrough(),
+        } | RunnableLambda(self.generate_response)
+    def process_question(self, question: str) -> str:
+        """
+        Parameters
+        ----------
+        **question:** str - The user's question to be answered
+        Output
+        ------
+        str: The generated answer to the question
+        Purpose
+        -------
+        Processes a user question through the RAG chain and returns an answer
+        Assumptions
+        -----------
+        - Question is a non-empty string
+        - RAG chain is properly initialized
+        Notes
+        -----
+        Main interface for question-answering functionality
+        """
+        return self.rag_chain.invoke(question)
+#############################################################################################################################
+def setup_streamlit_ui() -> None:
+    """
+    Parameters
+    ----------
+    None
+    Output
+    ------
+    None
+    Purpose
+    -------
+    Sets up the Streamlit user interface with proper styling and layout
+    Assumptions
+    -----------
+    - CSS file exists at ./static/styles/style.css
+    - Image file exists at ./static/images/ctp.png
+    Notes
+    -----
+    Handles all UI-related setup and styling
+    """
+    st.set_page_config(page_title="RAG Question Answering", page_icon="🤖")
+    # Load CSS.
+    with open("./static/styles/style.css") as f:
+        st.markdown(f"<style>{f.read()}</style>", unsafe_allow_html=True)
+    # Title and subtitles.
+    st.markdown(
+        '<h1 align="center" style="font-family: monospace; font-size: 2.1rem; margin-top: -4rem">RAG Question Answering</h1>',
+        unsafe_allow_html=True,
+    )
+    st.markdown(
+        '<h3 align="center" style="font-family: monospace; font-size: 1.5rem; margin-top: -2rem">Using Zoom Closed Captioning From The Lectures</h3>',
+        unsafe_allow_html=True,
+    )
+    st.markdown(
+        '<h2 align="center" style="font-family: monospace; font-size: 1.5rem; margin-top: 0rem">CUNY Tech Prep Tutorial 5</h2>',
+        unsafe_allow_html=True,
+    )
+    # Display logo.
+    left_co, cent_co, last_co = st.columns(3)
+    with cent_co:
+        st.image("./static/images/ctp.png")
+#############################################################################################################################
+def main():
+    """
+    Parameters
+    ----------
+    None
+    Output
+    ------
+    None
+    Purpose
+    -------
+    Main function that runs the Streamlit application
+    Assumptions
+    -----------
+    All required environment variables and files are present
+    Notes
+    -----
+    Entry point for the application
+    """
+    # Setup UI.
+    setup_streamlit_ui()
+    # Initialize RAG system.
+    rag_system = RAGQuestionAnswering()
+    # Create input elements.
+    query = st.text_input("Question:", key="question_input")
+    # Handle submission.
+    if st.button("Submit", type="primary"):
+        if query:
+            with st.spinner("Generating response..."):
+                response = rag_system.process_question(query)
+                st.text_area("Answer:", value=response, height=200, disabled=True)
+        else:
+            st.warning("Please enter a question.")
+    # Add GitHub link.
+    st.markdown(
+        """
+        <p align="center" style="font-family: monospace; color: #FAF9F6; font-size: 1rem;">
+        <b>Check out our <a href="https://github.com/GeorgiosIoannouCoder/" style="color: #FAF9F6;">GitHub repository</a></b>
+        </p>
+        """,
+        unsafe_allow_html=True,
+    )
+#############################################################################################################################
+if __name__ == "__main__":
+    main()