Update app.py
app.py CHANGED
@@ -1,45 +1,21 @@
 import gradio as gr
 from huggingface_hub import InferenceClient
 import os
-import openai
 
-# Add chatgpt-4o-mini to the model list
 MODELS = {
     "Zephyr 7B Beta": "HuggingFaceH4/zephyr-7b-beta",
     "DeepSeek Coder V2": "deepseek-ai/DeepSeek-Coder-V2-Instruct",
     "Meta Llama 3.1 8B": "meta-llama/Meta-Llama-3.1-8B-Instruct",
     "Mixtral 8x7B": "mistralai/Mixtral-8x7B-Instruct-v0.1",
     "Cohere Command R+": "CohereForAI/c4ai-command-r-plus",
-    "chatgpt-4o-mini": "chatgpt-4o-mini",  # add the OpenAI model
 }
 
-# Set up the OpenAI API client
-openai.api_key = os.getenv("OPENAI_API_KEY")
-
 def get_client(model_name):
-    # [five removed lines not recoverable here]
-        if not hf_token:
-            raise ValueError("HF_TOKEN environment variable is required")
-        return InferenceClient(model_id, token=hf_token)
-    else:
-        raise ValueError(f"Model {model_name} is not supported")
-
-def call_api(content, system_message, max_tokens, temperature, top_p):
-    response = openai.ChatCompletion.create(
-        model="gpt-4o-mini",
-        messages=[
-            {"role": "system", "content": system_message},
-            {"role": "user", "content": content},
-        ],
-        max_tokens=max_tokens,
-        temperature=temperature,
-        top_p=top_p,
-    )
-    return response.choices[0]['message']['content']
+    model_id = MODELS[model_name]
+    hf_token = os.getenv("HF_TOKEN")
+    if not hf_token:
+        raise ValueError("HF_TOKEN environment variable is required")
+    return InferenceClient(model_id, token=hf_token)
 
 def respond(
     message,
@@ -52,12 +28,6 @@ def respond(
 ):
     try:
         client = get_client(model_name)
-        if client is None and "chatgpt" in model_name:  # the OpenAI model case
-            assistant_message = call_api(message, system_message, max_tokens, temperature, top_p)
-            chat_history.append((message, assistant_message))
-            yield chat_history
-            return
-
     except ValueError as e:
         chat_history.append((message, str(e)))
         return chat_history
@@ -141,4 +111,4 @@ with gr.Blocks() as demo:
     clear_button.click(clear_conversation, outputs=chatbot, queue=False)
 
 if __name__ == "__main__":
-    demo.launch()
+    demo.launch()
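After this commit, every listed model is served through get_client() and the Hugging Face Inference API. The body of respond() falls outside the hunks above, so what follows is only a minimal standalone sketch of how the returned InferenceClient is presumably driven: the streaming loop, the model choice, and the prompts are assumptions inferred from the visible signature (max_tokens, temperature, top_p) and the generator-style chat history.

import os
from huggingface_hub import InferenceClient

# Build a client the same way the new get_client() does (HF_TOKEN required).
client = InferenceClient("HuggingFaceH4/zephyr-7b-beta", token=os.getenv("HF_TOKEN"))

response = ""
for chunk in client.chat_completion(
    messages=[
        {"role": "system", "content": "You are a helpful assistant."},
        {"role": "user", "content": "Hello!"},
    ],
    max_tokens=512,
    temperature=0.7,
    top_p=0.95,
    stream=True,  # yields partial chunks instead of one final response
):
    delta = chunk.choices[0].delta.content
    if delta:
        response += delta  # accumulate the assistant message token by token
print(response)

With stream=True, chat_completion yields incremental chunks, which matches a respond() that yields chat_history repeatedly as tokens arrive.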
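One note on the removed code: call_api() used the legacy pre-1.0 openai interface (module-level openai.api_key and openai.ChatCompletion.create), which no longer exists in openai>=1.0, so this path would have needed updating regardless. If the OpenAI route were ever restored, a sketch against the current v1 client would look roughly like the following; the model name "gpt-4o-mini" and the request shape are carried over from the removed function, everything else is an assumption.

from openai import OpenAI

client = OpenAI()  # reads OPENAI_API_KEY from the environment by default

def call_api(content, system_message, max_tokens, temperature, top_p):
    # Same request shape as the removed function, sent through the v1 client.
    response = client.chat.completions.create(
        model="gpt-4o-mini",
        messages=[
            {"role": "system", "content": system_message},
            {"role": "user", "content": content},
        ],
        max_tokens=max_tokens,
        temperature=temperature,
        top_p=top_p,
    )
    # v1 responses are typed objects rather than dicts, hence attribute access.
    return response.choices[0].message.content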