Spaces:

IntellijMind
/

chat-llm

Runtime error

App Files Community

Threatthriver committed on Aug 28

Commit

e7f3548

•

1 Parent(s): 09fa947

Update app.py

Browse files

Files changed (1) hide show

app.py +43 -19

app.py CHANGED Viewed

@@ -4,6 +4,16 @@ from huggingface_hub import InferenceClient
 # Initialize the InferenceClient with the model ID from Hugging Face
 client = InferenceClient(model="HuggingFaceH4/zephyr-7b-beta")
 def respond(
     message: str,
     history: list[tuple[str, str]],
@@ -14,7 +24,7 @@ def respond(
 ):
     """
     Generates a response from the AI model based on the user's message and chat history.
     Args:
         message (str): The user's input message.
         history (list): A list of tuples representing the conversation history (user, assistant).
@@ -26,46 +36,48 @@ def respond(
     Yields:
         str: The AI's response as it is generated.
     """
     # Prepare the conversation history for the API call
     messages = [{"role": "system", "content": system_message}]
     for user_input, assistant_response in history:
-        if user_input:
-            messages.append({"role": "user", "content": user_input})
-        if assistant_response:
-            messages.append({"role": "assistant", "content": assistant_response})
     # Add the latest user message to the conversation
     messages.append({"role": "user", "content": message})
     # Initialize an empty response
-    response = ""
     try:
         # Generate a response from the model with streaming
-        for message in client.chat_completion(
             messages=messages,
             max_tokens=max_tokens,
             stream=True,
             temperature=temperature,
             top_p=top_p,
         ):
-            token = message.choices[0].delta.content
-            response += token
-            yield response
     except Exception as e:
-        yield f"An error occurred: {str(e)}"
-# Define the ChatInterface with additional input components for user customization
 demo = gr.ChatInterface(
     fn=respond,
     additional_inputs=[
-        gr.Textbox(value="You are a friendly Chatbot.", label="System message"),
         gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
-        gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
         gr.Slider(
             minimum=0.1,
             maximum=1.0,
@@ -74,10 +86,22 @@ demo = gr.ChatInterface(
             label="Top-p (nucleus sampling)",
         ),
     ],
-    title="Chatbot Interface",
-    description="A customizable chatbot interface using Hugging Face's Inference API.",
 )
 # Launch the Gradio interface
 if __name__ == "__main__":
-    demo.launch()

 # Initialize the InferenceClient with the model ID from Hugging Face
 client = InferenceClient(model="HuggingFaceH4/zephyr-7b-beta")
+# Latest updates (you can replace this with actual update information)
+latest_updates = """
+**Zephyr 7B Beta Chatbot - Latest Updates:**
+* **Improved Error Handling:** The chatbot now provides clearer error messages if something goes wrong.
+* **Enhanced System Message Input:** You can now provide multi-line system messages to guide the AI's behavior.
+* **Optimized Temperature Range:** The temperature slider's range has been adjusted for better control over randomness.
+* **Robust Chunk Handling:** The chatbot now handles streamed responses more reliably, even if some chunks are missing content.
+"""
 def respond(
     message: str,
     history: list[tuple[str, str]],
 ):
     """
     Generates a response from the AI model based on the user's message and chat history.
     Args:
         message (str): The user's input message.
         history (list): A list of tuples representing the conversation history (user, assistant).
     Yields:
         str: The AI's response as it is generated.
     """
     # Prepare the conversation history for the API call
     messages = [{"role": "system", "content": system_message}]
     for user_input, assistant_response in history:
+        messages.append({"role": "user", "content": user_input})
+        messages.append({"role": "assistant", "content": assistant_response})
     # Add the latest user message to the conversation
     messages.append({"role": "user", "content": message})
     # Initialize an empty response
+    streamed_response = ""
     try:
         # Generate a response from the model with streaming
+        for response in client.chat_completion(
             messages=messages,
             max_tokens=max_tokens,
             stream=True,
             temperature=temperature,
             top_p=top_p,
         ):
+            chunk = response.choices[0].delta.get("content", "")
+            streamed_response += chunk
+            yield streamed_response
     except Exception as e:
+        yield f"**Error:** {str(e)}"
+# Define the ChatInterface with additional input components
 demo = gr.ChatInterface(
     fn=respond,
     additional_inputs=[
+        gr.Textbox(
+            value="You are a friendly and helpful assistant.",
+            label="System message",
+            lines=2
+        ),
         gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
+        gr.Slider(minimum=0.1, maximum=2.0, value=0.7, step=0.1, label="Temperature"),
         gr.Slider(
             minimum=0.1,
             maximum=1.0,
             label="Top-p (nucleus sampling)",
         ),
     ],
+    title="Zephyr 7B Beta Chatbot",
+    description="A customizable chatbot interface using Hugging Face's Zephyr 7B Beta model and Inference API.",
+)
+# Add the "Show Updates" button and output area
+with gr.Row():
+    updates_button = gr.Button("Show Latest Updates")
+    updates_output = gr.Markdown(visible=False)  # Initially hidden
+# Define the button's click event
+updates_button.click(
+    fn=lambda: latest_updates,
+    outputs=updates_output,
+    show_progress=False
 )
 # Launch the Gradio interface
 if __name__ == "__main__":
+    demo.launch()