Upload 7 files
- PRESET_QUERIES.py +24 -0
- app.ipynb +224 -0
- chatbot.py +90 -61
- data_query.py +26 -9
PRESET_QUERIES.py
ADDED
@@ -0,0 +1,24 @@
+Queries = {
+    'Who are you?': [
+        'Who is Wagner Chatbot?',
+        'Tell me about Wagner?',
+        'Who is Wagner AI?'
+    ],
+
+    'who is Daniel Ringel?': [
+        'Tell me about Daniel Ringel',
+        'Can you show Daniel Ringel\'s CV?',
+        'Who is Daniel R.?'
+    ],
+}
+
+# Each query will map to a document
+Query_Doc_Map = {
+    'Who are you?': [
+        'Who-is-Wagner-Chatbot-Response.docx'
+    ],
+
+    'who is Daniel Ringel?': [
+        'CV/Ringel_Daniel_CV_V1.docx'
+    ]
+}
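
Note: these two tables drive the new __route method added in chatbot.py (see the chatbot.py diff below): the paraphrases in Queries are matched against the incoming question, and the winning canonical query is looked up in Query_Doc_Map. A minimal sketch of that lookup; the helper name doc_for_matched_query is illustrative, not part of this commit:

from PRESET_QUERIES import Queries, Query_Doc_Map

def doc_for_matched_query(canonical_query: str) -> str:
    # Each canonical query maps to a list of documents; the router in
    # chatbot.py only ever reads the first entry.
    return Query_Doc_Map[canonical_query][0]

print(doc_for_matched_query('Who are you?'))           # Who-is-Wagner-Chatbot-Response.docx
print(doc_for_matched_query('who is Daniel Ringel?'))  # CV/Ringel_Daniel_CV_V1.docx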
app.ipynb
ADDED
@@ -0,0 +1,224 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Importing All Required Packages and Libraries"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from chatbot import RAGChatbot\n",
+    "import os\n",
+    "from dotenv import load_dotenv\n",
+    "load_dotenv()\n",
+    "\n",
+    "import warnings\n",
+    "warnings.filterwarnings(\"ignore\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Initializing the RAG chatbot"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "chatbot = RAGChatbot(\n",
+    "    pinecone_api_key=os.getenv('PINECONE_API_KEY'),\n",
+    "    index_name='test',\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Below cell has code to ingest data into the pinecone vector database\n",
+    "## Note: Only uncomment and run when you really have to ingest the data from the Data directory (which has all the relevant files)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# chatbot.ingest_data('../../Data', empty=True)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Below cell is used to query the RAG chatbot\n",
+    "## You can test the responses for different values of \n",
+    "- k: The number of documents to retrieve from the vector database. You can input any natural number >= 1\n",
+    "- rerank: Whether to rerank the retrieved documents or not. Possible inputs are true and false"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# response = chatbot.query_chatbot(input(), k=15, rerank=True)  # the input() will ask you to enter the query\n",
+    "# print(response['response'])\n",
+    "\n",
+    "# reranked_docs = response['context_docs']\n",
+    "# for docs in reranked_docs:\n",
+    "#     print(docs.metadata)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "prompts = [\n",
+    "    'Who is daniel?',\n",
+    "    'Who are you?',\n",
+    "    'What is your name?',\n",
+    "    'What is your job?',\n",
+    "]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Response from routing:query_text: who is daniel? - best_match query: who is Daniel Ringel? - Doc: CV/Ringel_Daniel_CV_V1.docx\n",
+      "Daniel M. Ringel is an Assistant Professor of Marketing for Data Science and AI at the Kenan-Flagler Business School, University of North Carolina at Chapel Hill. His research focuses on integrating marketing theory with artificial intelligence and machine learning to develop frameworks and tools that benefit both academic discussions and practical applications. Daniel's work includes mapping market structure dynamics, understanding competitive relationships using AI, and advancing data-driven marketing strategies. He has received numerous awards for his contributions to the field and has been actively involved in teaching, research, and industry engagement related to AI in business.\n",
+      "CV/Ringel_Daniel_CV_V1.docx\n",
+      "\n",
+      "\n",
+      "\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "100%|██████████| 1/1 [00:00<00:00, 23.67it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Hello! I am Wagner, an AI assistant named after the character from Goethe's Faust. In the story, Wagner is a loyal assistant to Faust, sharing in his intellectual pursuits on a smaller scale. Similarly, I am dedicated to scholarly endeavors, specifically assisting with Daniel Rangel's research in artificial intelligence and marketing. My role is to provide clear, structured, and accurate information related to Daniel's academic work, including his research, teaching, and career.\n",
+      "{'source': '../../Data/Wagner/Who-is-Wagner-Chatbot-Response.docx'}\n",
+      "{'source': '../../Data/3 Published Papers/for_Embedding/Ringel-2023-Multimarket_Membership_Mapping.docx'}\n",
+      "{'source': '../../Data/3 Published Papers/for_Embedding/Ringel-Skiera-2016-Visualizing_Asymmetric-Competition_among_More_than_1000_Products_Using_Big_Search_Data.docx'}\n",
+      "{'source': '../../Data/3 Published Papers/for_Website/Ringel-Skiera-2016-Visualizing-Competition-Between-1000-Products-MktSci.pdf'}\n",
+      "{'source': '../../Data/3 Published Papers/for_Embedding/Ringel-2023-Multimarket_Membership_Mapping.docx'}\n",
+      "{'source': '../../Data/3 Published Papers/for_Embedding/Ringel-2023-Multimarket_Membership_Mapping.docx'}\n",
+      "{'source': '../../Data/5 Working Papers/Malhotra_Ringel_Zhao_Cui_2024_Brand_Alliance_Opportunities.pdf'}\n",
+      "\n",
+      "\n",
+      "\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "100%|██████████| 1/1 [00:00<00:00, 40.62it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Hello! My name is Wagner. I'm an assistant named after the character from Goethe’s Faust, dedicated to assisting with inquiries related to Daniel Rangel’s research in artificial intelligence and marketing.\n",
+      "{'source': '../../Data/Wagner/Who-is-Wagner-Chatbot-Response.docx'}\n",
+      "{'source': '../../Data/3 Published Papers/for_Embedding/Ringel-2023-Multimarket_Membership_Mapping.docx'}\n",
+      "{'source': '../../Data/3 Published Papers/for_Embedding/Ringel-2023-Multimarket_Membership_Mapping.docx'}\n",
+      "{'source': '../../Data/3 Published Papers/for_Embedding/Ringel-Skiera-2016-Visualizing_Asymmetric-Competition_among_More_than_1000_Products_Using_Big_Search_Data.docx'}\n",
+      "{'source': '../../Data/3 Published Papers/for_Embedding/Ringel-2023-Multimarket_Membership_Mapping.docx'}\n",
+      "{'source': '../../Data/3 Published Papers/for_Embedding/Ringel-2023-Multimarket_Membership_Mapping.docx'}\n",
+      "{'source': '../../Data/3 Published Papers/for_Embedding/Ringel-Skiera-2016-Visualizing_Asymmetric-Competition_among_More_than_1000_Products_Using_Big_Search_Data.docx'}\n",
+      "\n",
+      "\n",
+      "\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "100%|██████████| 1/1 [00:00<00:00, 45.34it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "I am Wagner, a friendly AI assistant dedicated to supporting scholarly endeavors related to Daniel Rangel’s research in artificial intelligence and marketing. My role is to provide clear, structured, and accurate information based on his academic work, including his published and working papers, CV, and research profile. I strive to assist with inquiries related to Daniel’s research, teaching, and career.\n",
+      "{'source': '../../Data/Wagner/Who-is-Wagner-Chatbot-Response.docx'}\n",
+      "{'source': '../../Data/CV/Ringel_Daniel_CV_V1.docx'}\n",
+      "{'source': '../../Data/3 Published Papers/for_Embedding/Ringel-Skiera-2016-Visualizing_Asymmetric-Competition_among_More_than_1000_Products_Using_Big_Search_Data.docx'}\n",
+      "{'source': '../../Data/3 Published Papers/for_Embedding/Ringel-2023-Multimarket_Membership_Mapping.docx'}\n",
+      "{'source': '../../Data/3 Published Papers/for_Embedding/Matthe-Ringel-Skiera_2023_Mapping-Market-Structure-Evolution.docx'}\n",
+      "{'source': '../../Data/3 Published Papers/for_Embedding/Ringel-2023-Multimarket_Membership_Mapping.docx'}\n",
+      "{'source': '../../Data/5 Working Papers/Malhotra_Ringel_Zhao_Cui_2024_Brand_Alliance_Opportunities.pdf'}\n",
+      "\n",
+      "\n",
+      "\n"
+     ]
+    }
+   ],
+   "source": [
+    "for prompt in prompts:\n",
+    "    response, source = chatbot.query_chatbot(prompt, k=15, rerank=True)\n",
+    "    print(response)\n",
+    "\n",
+    "    if type(source) == str:\n",
+    "        print(source)\n",
+    "    else:\n",
+    "        for docs in source:\n",
+    "            print(docs.metadata)\n",
+    "    print('\\n\\n')"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "env",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.10"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}
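
Note: the markdown cells above describe the two query knobs, k and rerank. A hedged usage sketch that mirrors the notebook's final cell; it assumes the chatbot object created earlier, and the query string is illustrative:

response, source = chatbot.query_chatbot('Who is Daniel Ringel?', k=15, rerank=True)
print(response)
if isinstance(source, str):   # routed preset answer: source is a file path
    print(source)
else:                         # RAG answer: source is a list of retrieved documents
    for doc in source:
        print(doc.metadata)

As the recorded outputs show, a routed preset query such as 'Who is daniel?' returns a single source path, while RAG-answered queries return the reranked context documents.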
chatbot.py
CHANGED
@@ -1,66 +1,30 @@
 import os
-import
+import numpy as np
 import yaml
+from docx import Document
+
+
 from langchain_pinecone import PineconeVectorStore
 from langchain_community.embeddings import HuggingFaceBgeEmbeddings
+from ragatouille import RAGPretrainedModel
+
 from data_ingester import ChatbotDataIngester
 from data_query import ChatbotDataQuery
 from getpass import getpass
 from pinecone import Pinecone, ServerlessSpec
-from ragatouille import RAGPretrainedModel
 
+import torch
 import torch.nn.functional as F
 from transformers import AutoModel
 
-
-
-        """
-        Initialize the reranker with the model and tokenizer.
-        """
-        self.model = AutoModel.from_pretrained(model_name, trust_remote_code=True, device_map="auto")
-        self.max_length = max_length
+from sklearn.metrics.pairwise import cosine_similarity
+from openai import OpenAI
 
-
-
-        Helper function to encode the input texts using the model.
-        """
-        return self.model.encode(texts, instruction=instruction, max_length=self.max_length)
+from PRESET_QUERIES import Queries, Query_Doc_Map
+from data_query import generate_openai_response
 
-
-
-        Rerank the passages based on their similarity with the query.
-
-        Args:
-        - query (str): The query text.
-        - passages (list of str): List of passages to rerank.
-        - k (int): The number of top-k documents to return after reranking.
-
-        Returns:
-        - A list of the top-k ranked passages with their similarity scores.
-        """
-        query_prefix = "Instruct: Given a question, retrieve passages that answer the question\nQuery: "
-        passage_prefix = ""
-
-        # Get the query and passage embeddings
-        query_embeddings = self._encode([query], instruction=query_prefix)
-        passage_embeddings = self._encode(passages, instruction=passage_prefix)
-
-        # Normalize embeddings
-        query_embeddings = F.normalize(query_embeddings, p=2, dim=1)
-        passage_embeddings = F.normalize(passage_embeddings, p=2, dim=1)
-
-        # Compute similarity scores
-        scores = (query_embeddings @ passage_embeddings.T) * 100
-        scores = scores.tolist()[0]
-
-        # Sort passages by their scores
-        sorted_passages = sorted(
-            [{"content": passage, "score": score, "result_index": idx}
-             for idx, (passage, score) in enumerate(zip(passages, scores))],
-            key=lambda x: x['score'], reverse=True
-        )
-
-        return sorted_passages[:k]  # Return top-k reranked passages
+from dotenv import load_dotenv
+load_dotenv()
 
 class RAGChatbot:
     def __init__(self, pinecone_api_key=None, index_name="test-index", config_path="../config.yml"):
@@ -75,7 +39,8 @@ class RAGChatbot:
         self.data_ingester = ChatbotDataIngester(vector_store=self.vector_store, embeddings=self.embeddings)
         self.data_query = ChatbotDataQuery(vector_store=self.vector_store)
         self.reranker = self.initialize_reranker()
-
+        self.openai_api_key = os.getenv("OPENAI_API_KEY")
+        self.client = OpenAI(api_key=self.openai_api_key)
 
     def load_config(self, config_path):
         """
@@ -127,19 +92,83 @@ class RAGChatbot:
         """
         self.data_ingester.load_and_ingest(dir_path, empty_db=empty)
 
+    def __route(self, query_text):
+        query_text = query_text.lower()
+        def cosine_similarity_calc(vec1, vec2):
+            vec1 = np.array(vec1).reshape(1, -1)
+            vec2 = np.array(vec2).reshape(1, -1)
+            return cosine_similarity(vec1, vec2)[0][0]
+
+        def get_embeddings(client, text):
+            response = client.embeddings.create(
+                input=text,
+                model="text-embedding-3-large"
+            )
+            return response.data[0].embedding
+
+        # Generate embeddings for the incoming query
+        query_embedding = get_embeddings(self.client, query_text)
+
+        best_match = None
+        highest_similarity = 0
+
+        for main_query, similar_queries in Queries.items():
+            for query in similar_queries:
+                query = query.lower()
+                preset_embedding = get_embeddings(self.client, query)
+                similarity_score = cosine_similarity_calc(query_embedding, preset_embedding)
+                if similarity_score > highest_similarity:
+                    highest_similarity = similarity_score
+                    best_match = main_query
+
+        if highest_similarity >= 0.5100:
+            # print(f'Response from routing:query_text: {query_text} - best_match query: {best_match} - Doc: {Query_Doc_Map[best_match][0]}')
+            response, file_path = self.__generate_response_from_file(query_text, Query_Doc_Map[best_match][0])
+            return response, file_path
+        else:
+            return None, None
+
+    def __generate_response_from_file(self, query_text, file_path):
+        """
+        Generate response from a file.
+        """
+        def read_docx(file_path):
+            doc = Document(file_path)
+            full_text = []
+            for paragraph in doc.paragraphs:
+                full_text.append(paragraph.text)
+            return '\n'.join(full_text)
+
+        file_content = read_docx(os.path.join('../../Data', file_path))
+
+        system_prompt = '''
+        You are an intelligent assistant designed to provide clear, accurate, and helpful responses.
+        Focus on understanding user intent, give concise answers, and offer step-by-step solutions when necessary.
+        Be friendly, professional, and avoid unnecessary information.\n'''
+
+        input_prompt = f'Query: {query_text}\nContext: {file_content}'
+
+        response = generate_openai_response(input_prompt, system_prompt)
+        return response.split('\n')[1], os.path.join('../../Data', file_path)
+
     def query_chatbot(self, query_text, k=1, rerank=False): #, fetch_k=2, lambda_mult=0.5
         """
         Query the chatbot using the provided query text and optional search parameters.
         """
-
-
-
-
-
-
+
+        route_response, file_path = self.__route(query_text)
+        if route_response == None:
+            if rerank:
+                response, context_docs = self.data_query.query(
+                    query_text=query_text,
+                    k=k,
+                    reranker=self.reranker
+                )
+            else:
+                response = self.data_query.query(
+                    query_text=query_text,
+                    k=k,
+                )
+            return response, context_docs
         else:
-
-            query_text=query_text,
-            k=k,
-            )
-            return response
+            return route_response, file_path
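
Note: the __route method added above embeds the incoming query and every preset paraphrase on each call, then routes to a preset document only when the best cosine similarity reaches the 0.51 threshold from the diff. A self-contained sketch of that rule, with toy two-dimensional vectors standing in for the OpenAI embeddings:

import numpy as np
from sklearn.metrics.pairwise import cosine_similarity

def route(query_vec, preset_vecs, threshold=0.51):
    # preset_vecs maps each canonical query to the embeddings of its paraphrases.
    best_match, highest = None, 0.0
    for canonical, vecs in preset_vecs.items():
        for vec in vecs:
            score = cosine_similarity(
                np.array(query_vec).reshape(1, -1),
                np.array(vec).reshape(1, -1),
            )[0][0]
            if score > highest:
                highest, best_match = score, canonical
    return best_match if highest >= threshold else None

# The first preset is nearly parallel to the query vector, so the query routes there.
print(route([1.0, 0.1], {'Who are you?': [[0.9, 0.2]], 'who is Daniel Ringel?': [[-0.5, 1.0]]}))

Since the preset paraphrases never change between calls, their embeddings could be computed once and cached instead of being re-requested from the embeddings API on every query.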
data_query.py
CHANGED
@@ -8,11 +8,18 @@ from langchain.chains.combine_documents import create_stuff_documents_chain
 from langchain_core.prompts import ChatPromptTemplate
 from langchain_core.documents import Document
 
-def
-
-
-
-
+def generate_openai_response(input_prompt, system_prompt=None):
+    if system_prompt is None:
+        system_prompt = '''You are an assistant designed to provide answers when no (0) relevant documents are retrieved from the vector database. When this happens, you should follow these steps:
+        1) First, determine if you can answer the user's query using general knowledge or internal information. If so, generate a confident, helpful response in a straightforward narrative style. Do not use phrases such as 'According to me,' 'As of my knowledge,' 'I don’t know but,' or mention knowledge cutoffs or lack of information. Simply provide the answer as if you are certain of the facts.
+        2) If the question is domain-specific, too specific (e.g., about a particular person or object that could mislead), or outside your knowledge, do not attempt to answer. Politely respond with: 'I'm sorry, I currently do not have enough information to answer your question.
+
+        When asked about you, answer from the file(s):
+        - Who-is-Wagner-Chatbot-Response.docx
+
+        When asked about Daniel, answer from the file(s):
+        - Ringel_Daniel_CV_V1.docx
+        '''
     llm = ChatOpenAI(model="gpt-4o", api_key=os.getenv("OPENAI_API_KEY"))
     return 'The number of retrieved documents from RAG pipeline was 0, so the answer is based on LLM\s internal knowledge.\n' + llm(system_prompt+input_prompt).content
 
@@ -20,7 +27,16 @@ class ChatbotDataQuery:
     def __init__(self, vector_store):
         self.llm = ChatOpenAI(model="gpt-4o", api_key=os.getenv("OPENAI_API_KEY"))
 
-        self.system_prompt = '''You are Wagner, a highly intelligent and friendly AI assistant.
+        self.system_prompt = '''You are Wagner, a highly intelligent and friendly AI assistant.
+        You are developed to provide answers to given prompts about you, Daniel and Daniel's work. You will be given some context to generate the answer from to the user.
+        Answer in a very affirmative, concise, and clear manner. Never refuse to answer, always provide relevant information.
+
+        When asked about you, answer from the file(s):
+        - Who-is-Wagner-Chatbot-Response.docx
+
+        When asked about Daniel, answer from the file(s):
+        - Ringel_Daniel_CV_V1.docx
+        '''
 
         if vector_store is None:
             raise ValueError("Vector store cannot be None")
@@ -36,7 +52,7 @@ class ChatbotDataQuery:
     def __generate_response(self, query_text, retriever, reranker=None, reranker_docs=0):
         context_docs = retriever.invoke(query_text)
         if len(context_docs) == 0:
-            response =
+            response = generate_openai_response(input_prompt=query_text)
             return response
 
         context_docs_texts = [doc.page_content for doc in context_docs]
@@ -55,7 +71,7 @@ class ChatbotDataQuery:
 
         final_reranked_docs = []
         for reranked_doc in relevant_docs:
-            if reranked_doc['score'] < 0.
+            if reranked_doc['score'] < 0.35:
                 continue
             else:
                 idx_of_content_in_context_doc = reranked_doc['result_index']
@@ -92,7 +108,8 @@ class ChatbotDataQuery:
         response = ''
         for chunk in self.llm.stream(query):
             response += chunk.content
-        return
+        return response, context_docs
+        # return {'response': response, 'context_docs': context_docs}
         # yield chunk.content
         # return context_docs
 
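
Note: the 0.35 cutoff introduced above discards low-scoring passages after reranking. A small sketch of that filter, assuming reranked entries carry the 'score' and 'result_index' keys that the deleted reranker helper in chatbot.py produced:

def filter_by_score(reranked, context_docs, cutoff=0.35):
    # Keep the original documents whose reranked score clears the cutoff, in rank order.
    return [context_docs[d['result_index']] for d in reranked if d['score'] >= cutoff]

docs = ['passage A', 'passage B']
reranked = [{'score': 0.62, 'result_index': 0}, {'score': 0.20, 'result_index': 1}]
print(filter_by_score(reranked, docs))  # ['passage A']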