ds

Running

App Files Community

yangtb24 committed on Jan 21

Commit

869de0e

verified ·

1 Parent(s): 199c193

Update app.py

Browse files

Files changed (1) hide show

app.py +28 -21

app.py CHANGED Viewed

@@ -433,6 +433,7 @@ def handsome_chat_completions():
                 full_response_content = ""
                 reasoning_content_accumulated = ""  # Accumulate reasoning content
                 content_accumulated = ""  # Accumulate regular content
                 for chunk in response.iter_content(chunk_size=1024):
                     if chunk:
@@ -440,25 +441,32 @@ def handsome_chat_completions():
                             first_chunk_time = time.time()
                         full_response_content += chunk.decode("utf-8")
-                        try:
-                            chunk_json = json.loads(chunk.decode("utf-8").lstrip("data: ").strip())
-                            if "choices" in chunk_json and len(chunk_json["choices"]) > 0:
-                                delta = chunk_json["choices"][0].get("delta", {})
-                                if delta.get("reasoning_content") is not None:
-                                    reasoning_content_accumulated += delta.get("reasoning_content", "")
-                                    formatted_reasoning = f"{reasoning_content_accumulated}"
-                                    yield f"data: {json.dumps({'choices': [{'delta': {'content': formatted_reasoning}, 'index': 0, 'finish_reason': None}]})}\n\n"
-                                    reasoning_content_accumulated = ""
-                                if delta.get("content") is not None:
-                                    content_accumulated += delta.get("content", "")
-                                    yield f"data: {json.dumps({'choices': [{'delta': {'content': content_accumulated}, 'index': 0, 'finish_reason': None}]})}\n\n"
-                                    content_accumulated = ""
-                        except (KeyError, ValueError, json.JSONDecodeError) as e:
-                            logging.error(f"解析流式响应单行 JSON 失败: {e}, 行内容: {chunk.decode('utf-8')}")
-                            continue
                 end_time = time.time()
                 first_token_time = (
@@ -652,7 +660,6 @@ def handsome_chat_completions():
         logging.error(f"请求转发异常: {e}")
         return jsonify({"error": str(e)}), 500
 if __name__ == '__main__':
     logging.info(f"环境变量：{os.environ}")
@@ -673,4 +680,4 @@ if __name__ == '__main__':
         debug=False,
         host='0.0.0.0',
         port=int(os.environ.get('PORT', 7860))
-    )

                 full_response_content = ""
                 reasoning_content_accumulated = ""  # Accumulate reasoning content
                 content_accumulated = ""  # Accumulate regular content
+                first_reasoning_chunk = True # Flag to track the first reasoning chunk
                 for chunk in response.iter_content(chunk_size=1024):
                     if chunk:
                             first_chunk_time = time.time()
                         full_response_content += chunk.decode("utf-8")
+                        for line in chunk.decode("utf-8").splitlines():
+                            if line.startswith("data:"):
+                                try:
+                                    chunk_json = json.loads(line.lstrip("data: ").strip())
+                                    if "choices" in chunk_json and len(chunk_json["choices"]) > 0:
+                                        delta = chunk_json["choices"][0].get("delta", {})
+                                        if delta.get("reasoning_content") is not None:
+                                            if first_reasoning_chunk:
+                                                reasoning_content_accumulated += "```Thinking\n"
+                                                first_reasoning_chunk = False
+                                            reasoning_content_accumulated += delta.get("reasoning_content", "")
+                                        if delta.get("content") is not None:
+                                            if not first_reasoning_chunk:
+                                              reasoning_content_accumulated += "\n```"
+                                              first_reasoning_chunk = True
+                                            content_accumulated += delta.get("content", "")
+                                            yield f"data: {json.dumps({'choices': [{'delta': {'content': (reasoning_content_accumulated if reasoning_content_accumulated else '') + content_accumulated}, 'index': 0, 'finish_reason': None}]})}\n\n"
+                                            reasoning_content_accumulated = ""
+                                            content_accumulated = ""
+                                except (KeyError, ValueError, json.JSONDecodeError) as e:
+                                    logging.error(f"解析流式响应单行 JSON 失败: {e}, 行内容: {line}")
+                                    continue
                 end_time = time.time()
                 first_token_time = (
         logging.error(f"请求转发异常: {e}")
         return jsonify({"error": str(e)}), 500
 if __name__ == '__main__':
     logging.info(f"环境变量：{os.environ}")
         debug=False,
         host='0.0.0.0',
         port=int(os.environ.get('PORT', 7860))
+    )