Spaces:
Runtime error
Runtime error
ambrosfitz
committed on
Update app.py
Browse files
app.py
CHANGED
@@ -7,7 +7,7 @@ import time
|
|
7 |
api_key = os.environ.get("RUNPOD_API_KEY") # Make sure your API key is correctly configured
|
8 |
client = OpenAI(
|
9 |
api_key=api_key,
|
10 |
-
base_url="https://api.runpod.ai/v2/vllm-
|
11 |
)
|
12 |
|
13 |
def get_response(user_message, history, verbosity):
|
@@ -25,7 +25,7 @@ def get_response(user_message, history, verbosity):
|
|
25 |
|
26 |
# Make the API call with a custom stop sequence
|
27 |
response = client.chat.completions.create(
|
28 |
-
model='ambrosfitz/autotrain-10k-llama3-history',
|
29 |
messages=history_openai_format,
|
30 |
temperature=temperature,
|
31 |
max_tokens=512,
|
|
|
7 |
api_key = os.environ.get("RUNPOD_API_KEY") # Make sure your API key is correctly configured
|
8 |
client = OpenAI(
|
9 |
api_key=api_key,
|
10 |
+
base_url="https://api.runpod.ai/v2/vllm-anqrwdpcywrdiz/openai/v1",
|
11 |
)
|
12 |
|
13 |
def get_response(user_message, history, verbosity):
|
|
|
25 |
|
26 |
# Make the API call with a custom stop sequence
|
27 |
response = client.chat.completions.create(
|
28 |
+
model='ambrosfitz/autotrain-10k-llama3-history-deep',
|
29 |
messages=history_openai_format,
|
30 |
temperature=temperature,
|
31 |
max_tokens=512,
|