legalaid-chat

Running

App Files Files Community

github-actions committed on Aug 3

Commit

7873f3c

•

1 Parent(s): d4d8ea9

Sync updates from source repository

Browse files

Files changed (3) hide show

app.py +84 -5
query.py +8 -7
requirements.txt +2 -0

app.py CHANGED Viewed

@@ -1,13 +1,59 @@
 from omegaconf import OmegaConf
 from query import VectaraQuery
 import os
 import streamlit as st
 from streamlit_pills import pills
 from PIL import Image
 max_examples = 6
 def isTrue(x) -> bool:
     if isinstance(x, bool):
@@ -16,11 +62,11 @@ def isTrue(x) -> bool:
 def launch_bot():
     def generate_response(question):
-        response = vq.submit_query(question)
         return response
     def generate_streaming_response(question):
-        response = vq.submit_query_streaming(question)
         return response
     def show_example_questions():
@@ -41,11 +87,13 @@ def launch_bot():
             'source_data_desc': os.environ['source_data_desc'],
             'streaming': isTrue(os.environ.get('streaming', False)),
             'prompt_name': os.environ.get('prompt_name', None),
-            'examples': os.environ.get('examples', None)
         })
         st.session_state.cfg = cfg
         st.session_state.ex_prompt = None
-        st.session_state.first_turn = True
         example_messages = [example.strip() for example in cfg.examples.split(",")]
         st.session_state.example_messages = [em for em in example_messages if len(em)>0][:max_examples]
@@ -60,7 +108,13 @@ def launch_bot():
         image = Image.open('Vectara-logo.png')
         st.image(image, width=175)
         st.markdown(f"## About\n\n"
-                    f"This demo uses Retrieval Augmented Generation to ask questions about {cfg.source_data_desc}\n\n")
         st.markdown("---")
         st.markdown(
@@ -111,7 +165,32 @@ def launch_bot():
                     st.write(response)
             message = {"role": "assistant", "content": response}
             st.session_state.messages.append(message)
             st.rerun()
 if __name__ == "__main__":
     launch_bot()

 from omegaconf import OmegaConf
 from query import VectaraQuery
 import os
+import requests
+import json
+import uuid
 import streamlit as st
 from streamlit_pills import pills
+from streamlit_feedback import streamlit_feedback
 from PIL import Image
 max_examples = 6
+languages = {'English': 'eng', 'Spanish': 'spa', 'French': 'frs', 'Chinese': 'zho', 'German': 'deu', 'Hindi': 'hin', 'Arabic': 'ara',
+             'Portuguese': 'por', 'Italian': 'ita', 'Japanese': 'jpn', 'Korean': 'kor', 'Russian': 'rus', 'Turkish': 'tur', 'Persian (Farsi)': 'fas',
+             'Vietnamese': 'vie', 'Thai': 'tha', 'Hebrew': 'heb', 'Dutch': 'nld', 'Indonesian': 'ind', 'Polish': 'pol', 'Ukrainian': 'ukr',
+             'Romanian': 'ron', 'Swedish': 'swe', 'Czech': 'ces', 'Greek': 'ell', 'Bengali': 'ben', 'Malay (or Malaysian)': 'msa', 'Urdu': 'urd'}
+# Setup for HTTP API Calls to Amplitude Analytics
+if 'device_id' not in st.session_state:
+    st.session_state.device_id = str(uuid.uuid4())
+headers = {
+    'Content-Type': 'application/json',
+    'Accept': '*/*'
+}
+amp_api_key = os.getenv('AMPLITUDE_TOKEN')
+def thumbs_feedback(feedback, **kwargs):
+    """
+    Sends feedback to Amplitude Analytics
+    """
+    data = {
+            "api_key": amp_api_key,
+            "events": [{
+                "device_id": st.session_state.device_id,
+                "event_type": "provided_feedback",
+                "event_properties": {
+                    "Space Name": kwargs.get("title", "Unknown Space Name"),
+                    "Demo Type": "chatbot",
+                    "query": kwargs.get("prompt", "No user input"),
+                    "response": kwargs.get("response", "No chat response"),
+                    "feedback": feedback["score"],
+                    "Response Language": st.session_state.language
+                }
+            }]
+        }
+    response = requests.post('https://api2.amplitude.com/2/httpapi', headers=headers, data=json.dumps(data))
+    if response.status_code != 200:
+        print(f"Request failed with status code {response.status_code}. Response Text: {response.text}")
+    st.session_state.feedback_key += 1
+if "feedback_key" not in st.session_state:
+        st.session_state.feedback_key = 0
 def isTrue(x) -> bool:
     if isinstance(x, bool):
 def launch_bot():
     def generate_response(question):
+        response = vq.submit_query(question, languages[st.session_state.language])
         return response
     def generate_streaming_response(question):
+        response = vq.submit_query_streaming(question, languages[st.session_state.language])
         return response
     def show_example_questions():
             'source_data_desc': os.environ['source_data_desc'],
             'streaming': isTrue(os.environ.get('streaming', False)),
             'prompt_name': os.environ.get('prompt_name', None),
+            'examples': os.environ.get('examples', None),
+            'language': 'English'
         })
         st.session_state.cfg = cfg
         st.session_state.ex_prompt = None
+        st.session_state.first_turn = True
+        st.session_state.language = cfg.language
         example_messages = [example.strip() for example in cfg.examples.split(",")]
         st.session_state.example_messages = [em for em in example_messages if len(em)>0][:max_examples]
         image = Image.open('Vectara-logo.png')
         st.image(image, width=175)
         st.markdown(f"## About\n\n"
+                    f"This demo uses Retrieval Augmented Generation to ask questions about {cfg.source_data_desc}\n")
+        cfg.language = st.selectbox('Language:', languages.keys())
+        if st.session_state.language != cfg.language:
+            st.session_state.language = cfg.language
+            print(f"DEBUG: Language changed to {st.session_state.language}")
+            st.rerun()
         st.markdown("---")
         st.markdown(
                     st.write(response)
             message = {"role": "assistant", "content": response}
             st.session_state.messages.append(message)
+            # Send query and response to Amplitude Analytics
+            data = {
+                "api_key": amp_api_key,
+                "events": [{
+                    "device_id": st.session_state.device_id,
+                    "event_type": "submitted_query",
+                    "event_properties": {
+                        "Space Name": cfg["title"],
+                        "Demo Type": "chatbot",
+                        "query": st.session_state.messages[-2]["content"],
+                        "response": st.session_state.messages[-1]["content"],
+                        "Response Language": st.session_state.language
+                    }
+                }]
+            }
+            response = requests.post('https://api2.amplitude.com/2/httpapi', headers=headers, data=json.dumps(data))
+            if response.status_code != 200:
+                print(f"Amplitude request failed with status code {response.status_code}. Response Text: {response.text}")
             st.rerun()
+    if (st.session_state.messages[-1]["role"] == "assistant") & (st.session_state.messages[-1]["content"] != "How may I help you?"):
+        streamlit_feedback(feedback_type="thumbs", on_submit = thumbs_feedback, key = st.session_state.feedback_key,
+                                      kwargs = {"prompt": st.session_state.messages[-2]["content"],
+                                                "response": st.session_state.messages[-1]["content"],
+                                                "title": cfg["title"]})
 if __name__ == "__main__":
     launch_bot()

query.py CHANGED Viewed

@@ -10,7 +10,7 @@ class VectaraQuery():
         self.conv_id = None
-    def get_body(self, query_str: str, stream: False):
         corpora_list = [{
                 'corpus_key': corpus_key, 'lexical_interpolation': 0.005
             } for corpus_key in self.corpus_keys
@@ -40,11 +40,12 @@ class VectaraQuery():
             {
                 'prompt_name': self.prompt_name,
                 'max_used_search_results': 10,
-                'response_language': 'eng',
                 'citations':
                 {
                     'style': 'none'
-                }
             },
             'chat':
             {
@@ -70,14 +71,14 @@ class VectaraQuery():
             "grpc-timeout": "60S"
         }
-    def submit_query(self, query_str: str):
         if self.conv_id:
             endpoint = f"https://api.vectara.io/v2/chats/{self.conv_id}/turns"
         else:
             endpoint = "https://api.vectara.io/v2/chats"
-        body = self.get_body(query_str, stream=False)
         response = requests.post(endpoint, data=json.dumps(body), verify=True, headers=self.get_headers())
@@ -96,14 +97,14 @@ class VectaraQuery():
         return summary
-    def submit_query_streaming(self, query_str: str):
         if self.conv_id:
             endpoint = f"https://api.vectara.io/v2/chats/{self.conv_id}/turns"
         else:
             endpoint = "https://api.vectara.io/v2/chats"
-        body = self.get_body(query_str, stream=True)
         response = requests.post(endpoint, data=json.dumps(body), verify=True, headers=self.get_stream_headers(), stream=True)

         self.conv_id = None
+    def get_body(self, query_str: str, response_lang: str, stream: False):
         corpora_list = [{
                 'corpus_key': corpus_key, 'lexical_interpolation': 0.005
             } for corpus_key in self.corpus_keys
             {
                 'prompt_name': self.prompt_name,
                 'max_used_search_results': 10,
+                'response_language': response_lang,
                 'citations':
                 {
                     'style': 'none'
+                },
+                'enable_factual_consistency_score': False
             },
             'chat':
             {
             "grpc-timeout": "60S"
         }
+    def submit_query(self, query_str: str, language: str):
         if self.conv_id:
             endpoint = f"https://api.vectara.io/v2/chats/{self.conv_id}/turns"
         else:
             endpoint = "https://api.vectara.io/v2/chats"
+        body = self.get_body(query_str, language, stream=False)
         response = requests.post(endpoint, data=json.dumps(body), verify=True, headers=self.get_headers())
         return summary
+    def submit_query_streaming(self, query_str: str, language: str):
         if self.conv_id:
             endpoint = f"https://api.vectara.io/v2/chats/{self.conv_id}/turns"
         else:
             endpoint = "https://api.vectara.io/v2/chats"
+        body = self.get_body(query_str, language, stream=True)
         response = requests.post(endpoint, data=json.dumps(body), verify=True, headers=self.get_stream_headers(), stream=True)

requirements.txt CHANGED Viewed

@@ -3,3 +3,5 @@ toml==0.10.2
 omegaconf==2.3.0
 syrupy==4.0.8
 streamlit_pills==0.3.0

 omegaconf==2.3.0
 syrupy==4.0.8
 streamlit_pills==0.3.0
+streamlit-feedback==0.1.3
+uuid==1.30