Update app.py
app.py CHANGED
@@ -6,7 +6,7 @@ from cryptography.fernet import Fernet
 # --- LangChain / RAG Imports ---
 from langchain_community.vectorstores import FAISS
 from langchain.chains import ConversationalRetrievalChain
-from langchain.memory import ConversationBufferMemory
+from langchain.memory import ConversationSummaryMemory #ConversationBufferMemory
 from langchain_huggingface import HuggingFaceEmbeddings, HuggingFaceEndpoint
 
 def load_decrypted_preprompt(file_path="pre_prompt.enc"):
@@ -71,9 +71,10 @@ def initialize_qa_chain(temperature, max_tokens, top_k, vector_db):
         task="text-generation"
     )
 
-    memory = ConversationBufferMemory(
+    memory = ConversationSummaryMemory(
+        llm=llm,
+        max_token_limit=500,  # Adjust this to control the summary size
         memory_key="chat_history",
-        output_key="answer",
         return_messages=True
     )
 
@@ -118,19 +119,21 @@ def update_chat(message, history):
 def get_assistant_response(message, history, max_tokens, temperature, top_p, qa_chain_state_dict):
     """
     Generate the assistant's response using the QA chain (if available) or fallback to plain chat.
-
+    The pre-prompt is always included by concatenating it to the user's new question.
     """
     qa_chain = qa_chain_state_dict.get("qa_chain")
 
     if qa_chain is not None:
         # Format history to the plain-text format expected by the QA chain
         formatted_history = format_chat_history(history)
-        response = qa_chain.invoke({"question": message, "chat_history": formatted_history})
+        # Prepend the pre-prompt to the current question
+        combined_question = PRE_PROMPT + "\n" + message
+        response = qa_chain.invoke({"question": combined_question, "chat_history": formatted_history})
         answer = response.get("answer", "")
         history.append({"role": "assistant", "content": answer})
         return history, {"qa_chain": qa_chain}
 
-    # Fallback: Plain Chat Mode using the InferenceClient
+    # Fallback: Plain Chat Mode using the InferenceClient (pre-prompt already included here)
     messages = [{"role": "system", "content": PRE_PROMPT}] + history
     response = ""
     result = client.chat_completion(
@@ -147,6 +150,7 @@ def get_assistant_response(message, history, max_tokens, temperature, top_p, qa_
     history.append({"role": "assistant", "content": response})
     return history, {"qa_chain": qa_chain}
 
+
 # Global InferenceClient for plain chat (fallback)
 client = InferenceClient("deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B")
 
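
For orientation, a minimal sketch of how the changed pieces would sit inside initialize_qa_chain, assuming a standard ConversationalRetrievalChain setup. The retriever wiring and the HuggingFaceEndpoint repo_id are not visible in these hunks, so they are assumptions here, not part of the commit.

from langchain.chains import ConversationalRetrievalChain
from langchain.memory import ConversationSummaryMemory
from langchain_huggingface import HuggingFaceEndpoint


def initialize_qa_chain(temperature, max_tokens, top_k, vector_db):
    # Assumed repo_id: the model used for the endpoint is not shown in this diff;
    # the same id as the plain-chat InferenceClient is used for illustration.
    llm = HuggingFaceEndpoint(
        repo_id="deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B",
        temperature=temperature,
        max_new_tokens=max_tokens,
        task="text-generation",
    )

    # New in this commit: a summarizing memory instead of a full buffer, so long
    # chats are condensed by the LLM rather than replayed verbatim.
    # (The commit also passes max_token_limit=500 here to cap the summary size.)
    memory = ConversationSummaryMemory(
        llm=llm,
        memory_key="chat_history",
        return_messages=True,
    )

    # Assumed wiring: the retriever and chain construction are unchanged elsewhere in app.py.
    return ConversationalRetrievalChain.from_llm(
        llm=llm,
        retriever=vector_db.as_retriever(search_kwargs={"k": top_k}),
        memory=memory,
    )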