Update app.py
Browse files
app.py
CHANGED
@@ -425,7 +425,7 @@ def handsome_chat_completions():
|
|
425 |
|
426 |
if delta.get("content") is not None:
|
427 |
if not first_reasoning_chunk:
|
428 |
-
yield f"data: {json.dumps({'choices': [{'delta': {'content': '\n
|
429 |
first_reasoning_chunk = True
|
430 |
yield f"data: {json.dumps({'choices': [{'delta': {'content': delta['content']}, 'index': 0}]})}\n\n"
|
431 |
|
@@ -525,7 +525,6 @@ def handsome_chat_completions():
|
|
525 |
content_type="text/event-stream"
|
526 |
)
|
527 |
else:
|
528 |
-
# ... (Non-streaming part remains the same as in the previous response)
|
529 |
response.raise_for_status()
|
530 |
end_time = time.time()
|
531 |
response_json = response.json()
|
@@ -597,7 +596,6 @@ def handsome_chat_completions():
|
|
597 |
request_timestamps.append(time.time())
|
598 |
token_counts.append(prompt_tokens + completion_tokens)
|
599 |
|
600 |
-
# Reformat the response to standard OpenAI format for non-streaming responses
|
601 |
formatted_response = {
|
602 |
"id": response_json.get("id", ""),
|
603 |
"object": "chat.completion",
|
|
|
425 |
|
426 |
if delta.get("content") is not None:
|
427 |
if not first_reasoning_chunk:
|
428 |
+
yield f"data: {json.dumps({'choices': [{'delta': {'content': '\n```\n'}, 'index': 0}]})}\n\n"
|
429 |
first_reasoning_chunk = True
|
430 |
yield f"data: {json.dumps({'choices': [{'delta': {'content': delta['content']}, 'index': 0}]})}\n\n"
|
431 |
|
|
|
525 |
content_type="text/event-stream"
|
526 |
)
|
527 |
else:
|
|
|
528 |
response.raise_for_status()
|
529 |
end_time = time.time()
|
530 |
response_json = response.json()
|
|
|
596 |
request_timestamps.append(time.time())
|
597 |
token_counts.append(prompt_tokens + completion_tokens)
|
598 |
|
|
|
599 |
formatted_response = {
|
600 |
"id": response_json.get("id", ""),
|
601 |
"object": "chat.completion",
|