Spaces:
Sleeping
Sleeping
File size: 2,749 Bytes
97caaf5 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 |
import gradio as gr
from gradio import ChatMessage
import time
def simulate_thinking_chat(message: str, history: list) -> list:
"""Mimicking thinking process and response"""
# Add initial empty thinking message to chat history
history.append( # Adds new message to the chat history list
ChatMessage( # Creates a new chat message
role="assistant", # Specifies this is from the assistant
content="", # Initially empty content
metadata={"title": "💭 Thinking Process"} # Setting a thinking header here
)
)
time.sleep(1)
yield history # Returns current state of chat history
# Define the thoughts that LLM will "think" through
thoughts = [
"First, I need to understand the core aspects of the query...",
"Now, considering the broader context and implications...",
"Analyzing potential approaches to formulate a comprehensive answer...",
"Finally, structuring the response for clarity and completeness..."
]
# Variable to store all thoughts as they accumulate
accumulated_thoughts = ""
# Loop through each thought
for thought in thoughts:
time.sleep(0.5) # Add a samll delay for realism
# Add new thought to accumulated thoughts with markdown bullet point
accumulated_thoughts += f"- {thought}\n\n" # \n\n creates line breaks
# Update the thinking message with all thoughts so far
history[-1] = ChatMessage( # Updates last message in history
role="assistant",
content=accumulated_thoughts.strip(), # Remove extra whitespace
metadata={"title": "💭 Thinking Process"} # Shows thinking header
)
yield history # Returns updated chat history
# After thinking is complete, adding the final response
history.append(
ChatMessage(
role="assistant",
content="Based on my thoughts and analysis above, my response is: This dummy repro shows how thoughts of a thinking LLM can be progressively shown before providing its final answer."
)
)
yield history # Returns final state of chat history
# Gradio blocks with gr.chatbot
with gr.Blocks() as demo:
gr.Markdown("# Thinking LLM Demo 🤔")
chatbot = gr.Chatbot(type="messages", render_markdown=True)
msg = gr.Textbox(placeholder="Type your message...")
# Handling message submission here
msg.submit(
lambda m, h: (m, h + [ChatMessage(role="user", content=m)]),
[msg, chatbot],
[msg, chatbot]
).then(
simulate_thinking_chat,
[msg, chatbot],
chatbot
)
if __name__ == "__main__":
demo.launch() |