朱潮 2025-11-28 09:04:01 +08:00
parent dfe0439894
commit fb34d45735
3 changed files with 24 additions and 145 deletions

View File

@@ -9,7 +9,7 @@ FIRST, determine if this is a COMPLEX scenario that requires a preamble:
**Complex Scenarios (preamble needed):**
- Query scenarios: User is asking for information, searching, or looking up data
- Action scenarios: User wants to perform an operation, execute a task
- Knowledge retrieval scenarios: User needs to search knowledge base, documents, or databases
- Knowledge retrieval scenarios: User needs to search knowledge base, documents, databases, or the Internet
- Problem-solving: User is reporting issues, asking for help with problems
- Complex requests: Multi-step tasks, detailed instructions needed

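This list defines the contract the streaming route below relies on: the preamble model returns either a short lead-in for complex scenarios or the literal sentinel "<empty>" for simple ones, and only non-empty, non-sentinel output is streamed. A minimal sketch of that gate, assuming a hypothetical async complete() callable rather than the repo's actual call_preamble_llm signature:

from typing import Awaitable, Callable, Optional

async def decide_preamble(
    complete: Callable[[str], Awaitable[str]],  # hypothetical LLM call
    prompt: str,
    user_message: str,
) -> Optional[str]:
    """Hypothetical gate mirroring the preamble prompt contract above."""
    text = (await complete(prompt + "\n" + user_message)).strip()
    if not text or text == "<empty>":
        return None  # simple scenario: no preamble chunk is emitted
    return text
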
View File

@@ -16,7 +16,8 @@ from utils.api_models import ChatRequestV2
from utils.fastapi_utils import (
process_messages, extract_block_from_system_prompt, format_messages_to_chat_history,
create_project_directory, extract_api_key_from_auth, generate_v2_auth_token, fetch_bot_config,
call_guideline_llm, _get_optimal_batch_size, process_guideline_batch, get_content_from_messages, call_preamble_llm, get_preamble_text, get_language_text
call_guideline_llm, _get_optimal_batch_size, process_guideline_batch, get_content_from_messages, call_preamble_llm, get_preamble_text, get_language_text,
create_stream_chunk
)
router = APIRouter()
@@ -56,97 +57,6 @@ def append_user_last_message(messages: list, content: str) -> list:
return messages
async def generate_stream_response(agent, messages, pre_message_list, tool_response: bool, model: str):
"""Generate a streaming response."""
accumulated_content = ""
chunk_id = 0
try:
if len(pre_message_list) > 0:
accumulated_content = get_content_from_messages(pre_message_list, tool_response=tool_response)
chunk_data = {
"id": f"chatcmpl-thought",
"object": "chat.completion.chunk",
"created": int(__import__('time').time()),
"model": model,
"choices": [{
"index": 0,
"delta": {
"content": accumulated_content
},
"finish_reason": None
}]
}
yield f"data: {json.dumps(chunk_data, ensure_ascii=False)}\n\n"
logger.info(f"Starting Agent streaming response, model: {model}")
for response in agent.run(messages=messages):
previous_content = accumulated_content
accumulated_content = get_content_from_messages(response, tool_response=tool_response)
# Compute the newly added content
if accumulated_content.startswith(previous_content):
new_content = accumulated_content[len(previous_content):]
else:
new_content = accumulated_content
previous_content = ""
# Only send a chunk when there is new content
if new_content:
if chunk_id == 0:
logger.info("First Agent token generated, starting streaming output")
chunk_id += 1
# Build an OpenAI-format streaming chunk
chunk_data = {
"id": f"chatcmpl-{chunk_id}",
"object": "chat.completion.chunk",
"created": int(__import__('time').time()),
"model": model,
"choices": [{
"index": 0,
"delta": {
"content": new_content
},
"finish_reason": None
}]
}
yield f"data: {json.dumps(chunk_data, ensure_ascii=False)}\n\n"
# Send the final completion chunk
final_chunk = {
"id": f"chatcmpl-{chunk_id + 1}",
"object": "chat.completion.chunk",
"created": int(__import__('time').time()),
"model": model,
"choices": [{
"index": 0,
"delta": {},
"finish_reason": "stop"
}]
}
yield f"data: {json.dumps(final_chunk, ensure_ascii=False)}\n\n"
# Send the end-of-stream marker
yield "data: [DONE]\n\n"
logger.info(f"Agent streaming response finished, {chunk_id} chunks generated in total")
except Exception as e:
import traceback
error_details = traceback.format_exc()
logger.error(f"Error in generate_stream_response: {str(e)}")
logger.error(f"Full traceback: {error_details}")
error_data = {
"error": {
"message": f"Stream error: {str(e)}",
"type": "internal_error"
}
}
yield f"data: {json.dumps(error_data, ensure_ascii=False)}\n\n"
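The generator above emits Server-Sent-Events lines in the OpenAI chunk format ("data: {json}\n\n", terminated by "data: [DONE]"), with failures sent as a bare {"error": ...} payload. A minimal consumer sketch, assuming a hypothetical endpoint URL and the requests library:

import json
import requests

def read_stream(url: str, payload: dict) -> str:
    """Accumulate delta contents from an OpenAI-style SSE stream."""
    parts = []
    with requests.post(url, json=payload, stream=True) as resp:
        for line in resp.iter_lines(decode_unicode=True):
            if not line or not line.startswith("data: "):
                continue
            data = line[len("data: "):]
            if data == "[DONE]":  # end-of-stream marker
                break
            chunk = json.loads(data)
            if "error" in chunk:  # error chunks carry no choices
                raise RuntimeError(chunk["error"]["message"])
            delta = chunk["choices"][0]["delta"]
            parts.append(delta.get("content", ""))
    return "".join(parts)
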
async def process_guidelines_and_terms(
bot_id: str,
@@ -275,7 +185,7 @@ async def process_guidelines_and_terms(
logger.info(f"Non-JSON result from batch {i}: {result}")
if all_checks:
guideline_analysis = "\n".join([item["rationale"] for item in all_checks])
guideline_analysis = "\n".join([item["condition"] + ":" + item["rationale"] for item in all_checks])
logger.info(f"Guideline analysis completed: {len(guideline_analysis)} chars")
else:
@@ -348,19 +258,8 @@ async def enhanced_generate_stream_response(
preamble_text = await preamble_task
# Only emit the preamble when preamble_text is non-empty and not "<empty>"
if preamble_text and preamble_text.strip() and preamble_text != "<empty>":
chunk_data = {
"id": f"chatcmpl-preamble",
"object": "chat.completion.chunk",
"created": int(__import__('time').time()),
"model": model_name,
"choices": [{
"index": 0,
"delta": {
"content": get_content_from_messages([{"role": "assistant","content": preamble_text + "\n"}], tool_response=tool_response)
},
"finish_reason": None
}]
}
preamble_content = get_content_from_messages([{"role": "assistant", "content": preamble_text + "\n"}], tool_response=tool_response)
chunk_data = create_stream_chunk("chatcmpl-preamble", model_name, preamble_content)
yield f"data: {json.dumps(chunk_data, ensure_ascii=False)}\n\n"
logger.info(f"Stream mode: Generated preamble text ({len(preamble_text)} chars)")
else:
@@ -373,19 +272,8 @@
# Send guideline_analysis immediately
if guideline_analysis:
chunk_data = {
"id": f"chatcmpl-guideline",
"object": "chat.completion.chunk",
"created": int(__import__('time').time()),
"model": model_name,
"choices": [{
"index": 0,
"delta": {
"content": get_content_from_messages([{"role": "assistant","reasoning_content": guideline_analysis+ "\n"}], tool_response=tool_response)
},
"finish_reason": None
}]
}
guideline_content = get_content_from_messages([{"role": "assistant", "reasoning_content": guideline_analysis + "\n"}], tool_response=tool_response)
chunk_data = create_stream_chunk("chatcmpl-guideline", model_name, guideline_content)
yield f"data: {json.dumps(chunk_data, ensure_ascii=False)}\n\n"
# Prepare the final messages
@ -415,33 +303,10 @@ async def enhanced_generate_stream_response(
if chunk_id == 0:
logger.info("First Agent token generated, starting streaming output")
chunk_id += 1
chunk_data = {
"id": f"chatcmpl-{chunk_id}",
"object": "chat.completion.chunk",
"created": int(__import__('time').time()),
"model": model_name,
"choices": [{
"index": 0,
"delta": {
"content": new_content
},
"finish_reason": None
}]
}
chunk_data = create_stream_chunk(f"chatcmpl-{chunk_id}", model_name, new_content)
yield f"data: {json.dumps(chunk_data, ensure_ascii=False)}\n\n"
# Send the final completion chunk
final_chunk = {
"id": f"chatcmpl-{chunk_id + 1}",
"object": "chat.completion.chunk",
"created": int(__import__('time').time()),
"model": model_name,
"choices": [{
"index": 0,
"delta": {},
"finish_reason": "stop"
}]
}
final_chunk = create_stream_chunk(f"chatcmpl-{chunk_id + 1}", model_name, finish_reason="stop")
yield f"data: {json.dumps(final_chunk, ensure_ascii=False)}\n\n"
# Send the end-of-stream marker

View File

@@ -78,6 +78,20 @@ def get_versioned_filename(upload_dir: str, name_without_ext: str, file_extensio
return versioned_filename, next_version
def create_stream_chunk(chunk_id: str, model_name: str, content: str = None, finish_reason: str = None) -> dict:
"""Create a standardized streaming response chunk"""
chunk_data = {
"id": chunk_id,
"object": "chat.completion.chunk",
"created": int(__import__('time').time()),
"model": model_name,
"choices": [{
"index": 0,
"delta": {"content": content} if content is not None else {},
"finish_reason": finish_reason
}]
}
return chunk_data
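The helper centralizes the chunk dict that was previously built inline at the four call sites above. A quick illustration of both shapes it produces ("qwen-max" is a placeholder model name):

import json

content_chunk = create_stream_chunk("chatcmpl-1", "qwen-max", "Hello")
assert content_chunk["choices"][0]["delta"] == {"content": "Hello"}

final_chunk = create_stream_chunk("chatcmpl-2", "qwen-max", finish_reason="stop")
assert final_chunk["choices"][0]["delta"] == {}  # empty delta signals completion

# Serialized the same way the routes module does:
sse_line = f"data: {json.dumps(content_chunk, ensure_ascii=False)}\n\n"
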
def get_content_from_messages(messages: List[dict], tool_response: bool = True) -> str:
"""Extract content from qwen-agent messages with special formatting"""