Added files
- .gitattributes +1 -0
- app.py +7 -0
- data/nist_ai.pdf +3 -0
- functions.py +97 -0
- requirements.txt +9 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+data/nist_ai.pdf filter=lfs diff=lfs merge=lfs -text
app.py
ADDED
@@ -0,0 +1,7 @@
+import gradio as gr
+from functions import *
+
+rag_poc = gr.ChatInterface(get_response)
+
+if __name__ == "__main__":
+    rag_poc.launch()
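
The UI layer is intentionally thin: gr.ChatInterface wraps get_response into a complete chat app. If the Space page needs more polish, ChatInterface also accepts optional arguments such as title and examples. A minimal sketch (the title and example prompt are hypothetical, not part of this commit):

    import gradio as gr
    from functions import get_response

    # Optional polish; the title and starter prompt below are placeholders.
    rag_poc = gr.ChatInterface(
        get_response,
        title="NIST AI RMF Q&A",
        examples=["What is the NIST AI Risk Management Framework?"],
    )

    if __name__ == "__main__":
        rag_poc.launch()
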
data/nist_ai.pdf
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b98f5f456157e2de607322a9a2630175f93683754a455c469c0954e4e94a1b1c
+size 1204825
functions.py
ADDED
@@ -0,0 +1,97 @@
+from langchain_community.document_loaders import PyMuPDFLoader
+from langchain_text_splitters import RecursiveCharacterTextSplitter
+from langchain_openai import AzureOpenAIEmbeddings, AzureChatOpenAI
+from operator import itemgetter
+from langchain_core.runnables import RunnablePassthrough
+from langchain_qdrant import QdrantVectorStore
+from qdrant_client import QdrantClient
+from qdrant_client.http.models import Distance, VectorParams
+from langchain.prompts import ChatPromptTemplate
+import tiktoken
+import os
+
+### SETUP FUNCTIONS ###
+def tiktoken_len(text):
+    """Measure chunk length in tokens (gpt-4o encoding) rather than characters."""
+    tokens = tiktoken.encoding_for_model("gpt-4o").encode(text)
+    return len(tokens)
+
+def setup_vector_db():
+    # Get the directory of the current file
+    current_file_directory = os.path.dirname(os.path.abspath(__file__))
+    # Change the working directory to the current file's directory
+    os.chdir(current_file_directory)
+
+    # Load the NIST AI document
+    PDF_LINK = "data/nist_ai.pdf"
+    loader = PyMuPDFLoader(file_path=PDF_LINK)
+    nist_doc = loader.load()
+
+    text_splitter = RecursiveCharacterTextSplitter(
+        chunk_size=500,
+        chunk_overlap=100,
+        length_function=tiktoken_len,
+    )
+
+    nist_chunks = text_splitter.split_documents(nist_doc)
+
+    embeddings_small = AzureOpenAIEmbeddings(azure_deployment="text-embedding-3-small")
+
+    qdrant_client = QdrantClient(":memory:")  # set up the Qdrant DB in-memory
+
+    qdrant_client.create_collection(
+        collection_name="NIST_AI",
+        vectors_config=VectorParams(size=1536, distance=Distance.COSINE),
+    )
+
+    # Create a QdrantVectorStore with the client, collection name, and embedding model above.
+    qdrant_vector_store = QdrantVectorStore(
+        client=qdrant_client,
+        collection_name="NIST_AI",
+        embedding=embeddings_small,
+    )
+
+    qdrant_vector_store.add_documents(nist_chunks)  # add the document chunks to the vector store
+
+    retriever = qdrant_vector_store.as_retriever()
+
+    return retriever
+
+### VARIABLES ###
+
+# define a module-level retriever object, built once at import time
+retriever = setup_vector_db()
+qa_gpt4_llm = AzureChatOpenAI(azure_deployment="gpt-4", temperature=0)  # GPT-4 deployment, deterministic output
+
+# define a template for the RAG model
+rag_template = """
+You are a helpful assistant that helps users find information and answer their questions.
+You MUST use ONLY the available context to answer the question.
+If the information needed to answer the question cannot be found in the provided context, you MUST respond "I don't know."
+
+Question:
+{question}
+
+Context:
+{context}
+"""
+# create the RAG prompt object from the template
+prompt = ChatPromptTemplate.from_template(rag_template)
+
+# build the chain: route the question to the retriever for context, then feed both into the prompt and LLM
+retrieval_augmented_qa_chain = (
+    {"context": itemgetter("question") | retriever, "question": itemgetter("question")}
+    | RunnablePassthrough.assign(context=itemgetter("context"))
+    | {"response": prompt | qa_gpt4_llm, "context": itemgetter("context"), "question": itemgetter("question")}
+)
+
+### FUNCTIONS ###
+
+def get_response(query, history):
+    """A helper function to get the response from the RAG chain and return it to the UI."""
+    response = retrieval_augmented_qa_chain.invoke({"question": query})
+    return response["response"].content
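
Since the retriever and chain are built at import time, functions.py can be smoke-tested without the Gradio UI. A minimal sketch, assuming the standard Azure OpenAI environment variables are available (the key, endpoint, and API-version values below are placeholders, not part of this commit):

    import os

    # Placeholders: set real Azure OpenAI credentials before importing functions,
    # since the vector DB and LLM clients are created at import time.
    os.environ["AZURE_OPENAI_API_KEY"] = "<your-key>"
    os.environ["AZURE_OPENAI_ENDPOINT"] = "https://<resource>.openai.azure.com/"
    os.environ["OPENAI_API_VERSION"] = "2024-02-01"  # assumption: any supported version works

    from functions import get_response

    # history is accepted for Gradio's sake but unused, so an empty list is fine.
    print(get_response("What does the document say about managing AI risk?", history=[]))
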
requirements.txt
ADDED
@@ -0,0 +1,9 @@
+langchain-community
+gradio
+langchain-openai
+langchain
+qdrant-client
+tiktoken
+langchain-qdrant
+PyMuPDF
+langchain-core
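
Versions are left unpinned, so the Space resolves the latest compatible releases at build time. To mirror the Space environment locally, installing from the same file is enough; a sketch, assuming pip is available in the active interpreter:

    import subprocess, sys

    # Install the Space's dependencies into the current environment.
    subprocess.check_call([sys.executable, "-m", "pip", "install", "-r", "requirements.txt"])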