File size: 3,647 Bytes
ddca922 9230fc6 ddca922 41a2f7d ddca922 7940f63 ddca922 8a3a338 ddca922 8a3a338 ddca922 e40a5fc |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 |
from langchain_community.document_loaders import PyMuPDFLoader
from langchain_text_splitters import RecursiveCharacterTextSplitter
from langchain_openai import AzureOpenAIEmbeddings, AzureChatOpenAI, OpenAIEmbeddings, ChatOpenAI
from operator import itemgetter
from langchain_core.runnables import RunnablePassthrough
from langchain_qdrant import QdrantVectorStore
from qdrant_client import QdrantClient
from qdrant_client.http.models import Distance, VectorParams
from langchain.prompts import ChatPromptTemplate
import tiktoken
import os
from dotenv import load_dotenv
# Load environment variables from .env file.
# This must run before any Azure OpenAI client is constructed further down,
# since those clients are created without explicit credentials and therefore
# presumably pick up their key/endpoint settings from the environment.
load_dotenv()
def tiktoken_len(text):
    """Return the number of tokens in ``text`` using the "gpt-4o" encoding.

    Passed to the text splitter as its ``length_function`` so that chunk
    size and overlap are measured in tokens instead of characters.

    Args:
        text: The string to tokenize.

    Returns:
        The number of tokens produced by encoding ``text``.
    """
    tokens = tiktoken.encoding_for_model("gpt-4o").encode(text)
    return len(tokens)
def setup_vector_db():
    """Build an in-memory Qdrant vector store over the NIST AI PDF.

    Loads ``data/nist_ai.pdf``, splits it into token-measured chunks, embeds
    the chunks with the Azure OpenAI "text-embedding-3-small" deployment and
    indexes them in an in-memory Qdrant collection.

    Side effects:
        Changes the process working directory to the directory containing
        this file so that the relative PDF path resolves.

    Returns:
        A retriever created from the populated vector store.
    """
    # Get the directory of the current file
    current_file_directory = os.path.dirname(os.path.abspath(__file__))

    # Change the working directory to the current file's directory so the
    # relative PDF path below resolves no matter where the process was
    # started from. NOTE: this is a process-wide side effect.
    os.chdir(current_file_directory)

    # Load the NIST AI document
    PDF_LINK = "data/nist_ai.pdf"
    loader = PyMuPDFLoader(file_path=PDF_LINK)
    nist_doc = loader.load()

    # Chunk size and overlap are counted in tokens because the length
    # function is tiktoken_len rather than the default character count.
    text_splitter = RecursiveCharacterTextSplitter(
        chunk_size=500,
        chunk_overlap=100,
        length_function=tiktoken_len,
    )
    nist_chunks = text_splitter.split_documents(nist_doc)

    embeddings_small = AzureOpenAIEmbeddings(azure_deployment="text-embedding-3-small")
    # embeddings_small = OpenAIEmbeddings(model="text-embedding-3-small")

    # NOTE(review): the collection name is an assumption; it only has to be
    # the same in create_collection() and QdrantVectorStore() because the
    # store lives in memory and is rebuilt on every start.
    collection_name = "nist_ai"

    qdrant_client = QdrantClient(":memory:")  # set Qdrant DB and its location (in-memory)
    qdrant_client.create_collection(
        collection_name=collection_name,
        # The vector size must equal the embedding model's output dimension.
        vectors_config=VectorParams(size=1536, distance=Distance.COSINE),
    )

    # create a QdrantVectorStore object with the above specified client,
    # collection name, and embedding model.
    qdrant_vector_store = QdrantVectorStore(
        client=qdrant_client,
        collection_name=collection_name,
        embedding=embeddings_small,
    )
    qdrant_vector_store.add_documents(nist_chunks)  # add the documents to the QdrantVectorStore

    retriever = qdrant_vector_store.as_retriever()
    return retriever
# define a global variable to store the retriever object
# (built once at import time; this loads and embeds the whole PDF).
retriever = setup_vector_db()

qa_gpt4_llm = AzureChatOpenAI(azure_deployment="gpt-4o-mini", temperature=0)  # GPT-4o-mini model
# qa_gpt4_llm = ChatOpenAI(model="gpt-4o-mini", temperature=0) # GPT-4o-mini model

# define a template for the RAG model
# The {question} and {context} placeholders are filled from the dict that
# the chain below pipes into the prompt.
rag_template = """
You are a helpful assistant that helps users find information and answer their question.
You MUST use ONLY the available context to answer the question.
If necessary information to answer the question cannot be found in the provided context, you MUST say "I don't know."

Question:
{question}

Context:
{context}
"""

# create rag prompt object from the template
prompt = ChatPromptTemplate.from_template(rag_template)

# update the chain with LLM, prompt, and question variable.
# Stage 1: look up documents for the question and carry the question along.
# Stage 2: pass the dict through unchanged (context re-assigned to itself).
# Stage 3: run prompt -> LLM and return the answer together with the
#          retrieved context and the original question.
retrieval_augmented_qa_chain = (
    {"context": itemgetter("question") | retriever, "question": itemgetter("question")}
    | RunnablePassthrough.assign(context=itemgetter("context"))
    | {"response": prompt | qa_gpt4_llm, "context": itemgetter("context"), "question": itemgetter("question")}
)
def get_response(query, history):
    """A helper function to get the response from the RAG model and return it to the UI.

    Args:
        query: The user's question; passed to the chain under the
            ``"question"`` key.
        history: Not used by this function. Presumably present because the
            chat UI callback passes it — TODO confirm against the caller.

    Returns:
        The ``content`` attribute of the chain's ``"response"`` output.
    """
    response = retrieval_augmented_qa_chain.invoke({"question": query})
    return response["response"].content