Upload folder using huggingface_hub
Files changed:
- .gradio/flagged/dataset1.csv  (+3, -0)
- GradioLMstudioInterface.py    (+78, -68)
- lmstudio_gradio.py            (+202, -78)
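The commit title indicates the files were pushed with huggingface_hub. A minimal sketch of how such a commit can be produced with HfApi.upload_folder follows; the repo_id below is a placeholder, not taken from this page:

# Hypothetical reproduction of this commit with huggingface_hub; repo_id is a placeholder.
from huggingface_hub import HfApi

api = HfApi()
api.upload_folder(
    folder_path=".",                     # local folder containing the files listed above
    repo_id="user/lmstudio-gradio",      # placeholder repo id
    repo_type="space",
    commit_message="Upload folder using huggingface_hub",
)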
.gradio/flagged/dataset1.csv
ADDED
@@ -0,0 +1,3 @@
+user_input,history,output 0,history,timestamp
+Hi,,[],,2024-12-02 11:27:12.880943
+,,[],,2024-12-02 12:13:03.266406
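These are rows appended by Gradio's flagging mechanism while the app ran. A small sketch for inspecting them, assuming the path shown above:

# Print the flagged interactions recorded in the CSV above.
import csv

with open(".gradio/flagged/dataset1.csv", newline="") as f:
    for row in csv.DictReader(f):
        print(row.get("user_input"), "->", row.get("timestamp"))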
GradioLMstudioInterface.py
CHANGED
@@ -1,93 +1,103 @@

Only fragments of the 93 removed lines survive; they show the earlier revision took model, temperature, and max_tokens as parameters and wrapped each request in try/except, returning f"Error: {str(e)}" on failure. The file after this commit reads:

import gradio as gr
import requests

# LM Studio REST API base URL
BASE_URL = "http://localhost:1234/api/v0"

# Function to handle chat completions
def chat_with_lmstudio(messages):
    url = f"{BASE_URL}/chat/completions"
    payload = {
        "model": "granite-3.0-2b-instruct",  # Replace with the model you have loaded
        "messages": messages,
        "temperature": 0.7,
        "max_tokens": 1024,
        "stream": False
    }
    response = requests.post(url, json=payload)
    response.raise_for_status()
    response_data = response.json()
    return response_data['choices'][0]['message']['content']

# Function to handle text completions
def get_text_completion(prompt):
    url = f"{BASE_URL}/completions"
    payload = {
        "model": "granite-3.0-2b-instruct",  # Replace with the model you have loaded
        "prompt": prompt,
        "temperature": 0.7,
        "max_tokens": 100,
        "stream": False
    }
    response = requests.post(url, json=payload)
    response.raise_for_status()
    response_data = response.json()
    return response_data['choices'][0]['text']

# Function to handle text embeddings
def get_text_embedding(text):
    url = f"{BASE_URL}/embeddings"
    payload = {
        "model": "text-embedding-nomic-embed-text-v1.5",  # Replace with your embedding model
        "input": text
    }
    response = requests.post(url, json=payload)
    response.raise_for_status()
    response_data = response.json()
    return response_data['data'][0]['embedding']

# Gradio interface for chat
def gradio_chat_interface():
    def chat_interface(user_input, history):
        # Format history in LM Studio messages format
        messages = []
        for user_msg, assistant_msg in history:
            messages.append({"role": "user", "content": user_msg})
            messages.append({"role": "assistant", "content": assistant_msg})
        messages.append({"role": "user", "content": user_input})

        # Get response from LM Studio
        response = chat_with_lmstudio(messages)

        # Update history with the assistant's response
        history.append((user_input, response))
        return history, history

    chat_interface = gr.ChatInterface(chat_interface, type='messages')
    chat_interface.launch(share=True)

# Gradio interface for text completion
def gradio_text_completion():
    gr.Interface(
        fn=get_text_completion,
        inputs="text",
        outputs="text",
        title="Text Completion with LM Studio"
    ).launch(share=True)

# Gradio interface for text embedding
def gradio_text_embedding():
    gr.Interface(
        fn=get_text_embedding,
        inputs="text",
        outputs="text",
        title="Text Embedding with LM Studio"
    ).launch(share=True)

# Main menu to choose the interface
def main():
    with gr.Blocks() as demo:
        gr.Markdown("""
        # LM Studio API Interface
        Choose which function you want to use with LM Studio:
        """)

        with gr.Row():
            gr.Button("Chat with Model").click(gradio_chat_interface)
            gr.Button("Text Completion").click(gradio_text_completion)
            gr.Button("Text Embedding").click(gradio_text_embedding)

    demo.launch(share=True)

if __name__ == "__main__":
    main()
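For a quick sanity check outside the Gradio UI, the three helpers above can be called directly. This is a minimal sketch, assuming an LM Studio server is listening on localhost:1234 with the chat and embedding models named in the file loaded:

# Smoke test for the helpers in GradioLMstudioInterface.py.
from GradioLMstudioInterface import (
    chat_with_lmstudio, get_text_completion, get_text_embedding
)

reply = chat_with_lmstudio([{"role": "user", "content": "Say hello in one sentence."}])
print("chat:", reply)

print("completion:", get_text_completion("The capital of France is"))

embedding = get_text_embedding("hello world")
print("embedding length:", len(embedding))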
lmstudio_gradio.py
CHANGED
@@ -1,93 +1,217 @@

Only fragments of the 93 removed lines survive; they show the earlier revision used non-streaming chat, completion, and embedding helpers that took model, temperature, and max_tokens as parameters and wrapped each request in try/except, returning f"Error: {str(e)}" on failure. The file after this commit reads:

import gradio as gr
import requests
import logging
import json
import os
import numpy as np

# Set up logging to help troubleshoot issues
logging.basicConfig(level=logging.DEBUG)

# LM Studio REST API base URL
BASE_URL = "http://localhost:1234/v1"

# Function to handle chat completions with streaming support
def chat_with_lmstudio(messages):
    url = f"{BASE_URL}/chat/completions"
    payload = {
        "model": "bartowski/Qwen2.5-Coder-32B-Instruct-GGUF/Qwen2.5-Coder-32B-Instruct-IQ2_M.gguf",  # Replace with your chat model
        "messages": messages,
        "temperature": 0.7,
        "max_tokens": 4096,
        "stream": True
    }
    logging.debug(f"Sending POST request to URL: {url}")
    logging.debug(f"Payload: {json.dumps(payload, indent=2)}")
    try:
        with requests.post(url, json=payload, stream=True) as response:
            logging.debug(f"Response Status Code: {response.status_code}")
            response.raise_for_status()
            collected_response = ""
            for chunk in response.iter_lines():
                if chunk:
                    chunk_data = chunk.decode('utf-8').strip()
                    if chunk_data == "[DONE]":
                        logging.debug("Received [DONE] signal. Ending stream.")
                        break
                    if chunk_data.startswith("data: "):
                        chunk_data = chunk_data[6:].strip()
                    logging.debug(f"Received Chunk: {chunk_data}")
                    try:
                        response_data = json.loads(chunk_data)
                        if "choices" in response_data and len(response_data["choices"]) > 0:
                            content = response_data['choices'][0].get('delta', {}).get('content', "")
                            collected_response += content
                            yield content
                    except json.JSONDecodeError:
                        logging.error(f"Failed to decode JSON from chunk: {chunk_data}")
            if not collected_response:
                yield "I'm sorry, I couldn't generate a response. Could you please try again?"
    except requests.exceptions.RequestException as e:
        logging.error(f"Request to LM Studio failed: {e}")
        yield "An error occurred while connecting to LM Studio. Please try again later."

# Function to get embeddings from LM Studio
def get_embeddings(text):
    url = f"{BASE_URL}/embeddings"
    payload = {
        "model": "nomad_embed_text_v1_5_Q8_0",  # Use the exact model name registered in LM Studio
        "input": text
    }
    logging.debug(f"Sending POST request to URL: {url}")
    logging.debug(f"Payload: {json.dumps(payload, indent=2)}")
    try:
        response = requests.post(url, json=payload)
        response.raise_for_status()
        data = response.json()
        embedding = data['data'][0]['embedding']
        logging.debug(f"Received Embedding: {embedding}")
        return embedding
    except requests.exceptions.RequestException as e:
        logging.error(f"Request to LM Studio for embeddings failed: {e}")
        return None

# Function to calculate cosine similarity
def cosine_similarity(vec1, vec2):
    if not vec1 or not vec2:
        return 0
    vec1 = np.array(vec1)
    vec2 = np.array(vec2)
    if np.linalg.norm(vec1) == 0 or np.linalg.norm(vec2) == 0:
        return 0
    return np.dot(vec1, vec2) / (np.linalg.norm(vec1) * np.linalg.norm(vec2))

# Gradio Blocks interface for chat with file upload and embeddings
def gradio_chat_interface():
    with gr.Blocks() as iface:
        gr.Markdown("# Chat with LM Studio 🚀")
        gr.Markdown("A chat interface powered by LM Studio. You can send text messages or upload files (e.g., `.txt`) to include in the conversation.")

        chatbot = gr.Chatbot(type='messages')  # Specify 'messages' type to avoid deprecated tuple format
        state = gr.State([])  # To store conversation history as list of dicts
        embeddings_state = gr.State([])  # To store embeddings

        with gr.Row():
            with gr.Column(scale=4):
                user_input = gr.Textbox(
                    label="Type your message here",
                    placeholder="Enter text and press enter",
                    lines=1
                )
            with gr.Column(scale=1):
                file_input = gr.File(
                    label="Upload a file",
                    file_types=[".txt"],  # Restrict to text files; modify as needed
                    type="binary"  # Corrected from 'file' to 'binary'
                )

        send_button = gr.Button("Send")

        # Function to handle chat interactions
        def chat_interface(user_message, uploaded_file, history, embeddings):
            # Initialize history and embeddings if None
            if history is None:
                history = []
            if embeddings is None:
                embeddings = []

            # Process uploaded file if present
            if uploaded_file is not None:
                try:
                    # Read the uploaded file's content
                    file_content = uploaded_file.read().decode('utf-8')
                    user_message += f"\n\n[File Content]:\n{file_content}"
                    logging.debug(f"Processed uploaded file: {uploaded_file.name}")

                    # Generate embedding for the file content
                    file_embedding = get_embeddings(file_content)
                    if file_embedding:
                        embeddings.append((file_content, file_embedding))
                        logging.debug(f"Stored embedding for uploaded file: {uploaded_file.name}")
                except Exception as e:
                    logging.error(f"Error reading uploaded file: {e}")
                    user_message += "\n\n[Error reading the uploaded file.]"

            # Generate embedding for the user message
            user_embedding = get_embeddings(user_message)
            if user_embedding:
                embeddings.append((user_message, user_embedding))
                logging.debug("Stored embedding for user message.")

            # Retrieve relevant context based on embeddings (optional)
            # For demonstration, we'll retrieve top 2 similar past messages
            context_messages = []
            if embeddings:
                similarities = []
                for idx, (text, embed) in enumerate(embeddings[:-1]):  # Exclude the current user message
                    sim = cosine_similarity(user_embedding, embed)
                    similarities.append((sim, idx))
                # Sort by similarity
                similarities.sort(reverse=True, key=lambda x: x[0])
                top_n = 2
                top_indices = [idx for (_, idx) in similarities[:top_n]]
                for idx in top_indices:
                    context_messages.append(history[idx]['content'])  # Append user messages as context

            # Append user message to history
            history.append({"role": "user", "content": user_message})
            logging.debug(f"Updated History: {history}")

            # Format history with additional context
            messages = []
            if context_messages:
                messages.append({"role": "system", "content": "You have the following context:"})
                for ctx in context_messages:
                    messages.append({"role": "user", "content": ctx})
                messages.append({"role": "system", "content": "Use this context to assist the user."})

            # Append all messages from history
            messages.extend(history)

            # Get response from LM Studio
            response_stream = chat_with_lmstudio(messages)
            response = ""

            # To handle streaming, we'll initialize the assistant message and update it incrementally
            assistant_message = {"role": "assistant", "content": ""}
            history.append(assistant_message)
            logging.debug(f"Appended empty assistant message: {assistant_message}")

            for chunk in response_stream:
                response += chunk
                # Update the assistant message content
                assistant_message['content'] = response
                logging.debug(f"Updated assistant message: {assistant_message}")
                # Yield the updated history and embeddings
                yield history, embeddings

            # Finalize the history with the complete response
            assistant_message['content'] = response
            logging.debug(f"Final assistant message: {assistant_message}")
            yield history, embeddings

        # Connect the send button to the chat function
        send_button.click(
            fn=chat_interface,
            inputs=[user_input, file_input, state, embeddings_state],
            outputs=[chatbot, embeddings_state],
            queue=True  # Enable queuing for handling multiple requests
        )

        # Also allow pressing Enter in the textbox to send the message
        user_input.submit(
            fn=chat_interface,
            inputs=[user_input, file_input, state, embeddings_state],
            outputs=[chatbot, embeddings_state],
            queue=True
        )

        # Add debug statements to determine file pattern issues
        logging.debug(f"Current working directory: {os.getcwd()}")
        logging.debug(f"Files in current directory: {os.listdir(os.getcwd())}")

    iface.launch(share=True)

# Main function to launch the chat interface
if __name__ == "__main__":
    gradio_chat_interface()
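As a rough usage sketch, not part of the commit, the streaming generator and the cosine_similarity helper above can also be exercised without the UI, assuming the LM Studio server and models configured in lmstudio_gradio.py are available:

# Drive the streaming chat generator and the similarity helper directly.
from lmstudio_gradio import chat_with_lmstudio, get_embeddings, cosine_similarity

# Stream a chat completion chunk by chunk.
for chunk in chat_with_lmstudio([{"role": "user", "content": "Write a haiku about code."}]):
    print(chunk, end="", flush=True)
print()

# Compare two embeddings with the cosine_similarity helper.
a = get_embeddings("gradio interface")
b = get_embeddings("web UI for a model")
if a and b:
    print("similarity:", cosine_similarity(a, b))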