feat(agent-core): 补齐提示词编排与结构化解析

2026-05-30 00:20:40 +08:00
parent ba3f5fc584
commit df45a89eb1
5 changed files with 421 additions and 29 deletions
--- a/agent_core/orchestrator.py
+++ b/agent_core/orchestrator.py
@@ -1,40 +1,153 @@
+import json
 import time

+from .llm_provider import create_llm_provider, get_runtime_llm_config
 from .results import AgentResult
-from .structured_output import build_mock_structured_output
+from .structured_output import (
+    build_response_schema_hint,
+    extract_answer_from_structured_output,
+    parse_structured_output,
+)
 from .tool_registry import run_declared_tools
 from .rag.retriever import retrieve


 def run_agent(scenario_config: dict, user_input: str, options: dict | None = None) -> AgentResult:
+    """
+    执行当前场景的最小 Agent 闭环。
+
+    处理顺序保持和设计文档一致：
+    1. 读取场景配置
+    2. 执行 RAG 检索
+    3. 执行声明式工具
+    4. 构造 Prompt 并调用 LLM
+    5. 解析结构化结果
+    6. 统一返回 AgentResult
+    """
    started_at = time.perf_counter()
    options = options or {}
    output_type = scenario_config.get("output", {}).get("type", "general_answer")

-    references = []
-    rag_config = scenario_config.get("rag", {})
-    if rag_config.get("enabled"):
-        references = retrieve(
-            scenario_id=scenario_config.get("id", ""),
-            query=user_input,
-            collection=rag_config.get("collection", scenario_config.get("id", "")),
-            top_k=rag_config.get("top_k", 5),
-            document_ids=options.get("document_ids"),
-            store_path=options.get("rag_store_path"),
-        )
-
+    references = _collect_references(scenario_config=scenario_config, user_input=user_input, options=options)
    tool_calls = run_declared_tools(scenario_config.get("tools", []), user_input)
-    structured_output = build_mock_structured_output(output_type, user_input, references)
-    answer = f"已根据「{scenario_config.get('name', '当前场景')}」生成模拟回答：{user_input}"
+    messages = build_messages(
+        scenario_config=scenario_config,
+        user_input=user_input,
+        references=references,
+        tool_calls=tool_calls,
+    )
+
+    provider = options.get("llm_provider") or create_llm_provider(
+        get_runtime_llm_config(options.get("llm_config"))
+    )
+    llm_response = provider.generate(
+        messages,
+        response_format=build_response_schema_hint(output_type),
+    )
    latency_ms = int((time.perf_counter() - started_at) * 1000)

+    if not llm_response.success:
+        return AgentResult(
+            answer="模型调用失败，请检查配置或稍后重试。",
+            structured_output={},
+            references=references,
+            tool_calls=tool_calls,
+            raw_output="",
+            model_name=llm_response.model_name or "unknown-model",
+            latency_ms=latency_ms,
+            status="failed",
+            error=str(llm_response.error or "未知模型错误"),
+        )
+
+    structured_output, _ = parse_structured_output(llm_response.content, output_type)
+    answer = extract_answer_from_structured_output(structured_output, llm_response.content)
    return AgentResult(
        answer=answer,
        structured_output=structured_output,
        references=references,
        tool_calls=tool_calls,
-        raw_output=answer,
-        model_name=options.get("model_name", "mock-model"),
+        raw_output=llm_response.content,
+        model_name=llm_response.model_name or "unknown-model",
        latency_ms=latency_ms,
        status="success",
    )
+
+
+def build_messages(
+    scenario_config: dict,
+    user_input: str,
+    references: list[dict],
+    tool_calls: list[dict],
+) -> list[dict]:
+    """将场景配置、检索结果和工具结果整合为最小可解释 Prompt。"""
+    agent_config = scenario_config.get("agent", {})
+    system_message = "\n".join(
+        [
+            f"你当前扮演的角色：{agent_config.get('role', '通用业务助手')}",
+            f"当前任务目标：{agent_config.get('goal', '根据输入生成结构化结果')}",
+            "执行要求：",
+            _format_instructions(agent_config.get("instructions", [])),
+            f"输出类型：{scenario_config.get('output', {}).get('type', 'general_answer')}",
+            "请优先输出 JSON 对象，字段必须贴近约定输出结构。",
+        ]
+    )
+    context_message = "\n".join(
+        [
+            f"当前场景：{scenario_config.get('name', '未命名场景')}",
+            _format_references(references),
+            _format_tool_calls(tool_calls),
+        ]
+    )
+    return [
+        {"role": "system", "content": system_message},
+        {"role": "assistant", "content": context_message},
+        {"role": "user", "content": user_input},
+    ]
+
+
+def _collect_references(scenario_config: dict, user_input: str, options: dict) -> list[dict]:
+    """按场景配置执行检索，并保持无 RAG 场景也能正常返回空列表。"""
+    rag_config = scenario_config.get("rag", {})
+    if not rag_config.get("enabled"):
+        return []
+    return retrieve(
+        scenario_id=scenario_config.get("id", ""),
+        query=user_input,
+        collection=rag_config.get("collection", scenario_config.get("id", "")),
+        top_k=rag_config.get("top_k", 5),
+        document_ids=options.get("document_ids"),
+        store_path=options.get("rag_store_path"),
+    )
+
+
+def _format_instructions(instructions: list[str]) -> str:
+    if not instructions:
+        return "1. 结合知识库和工具结果回答。\n2. 信息不足时明确说明。"
+    return "\n".join(f"{index}. {item}" for index, item in enumerate(instructions, start=1))
+
+
+def _format_references(references: list[dict]) -> str:
+    if not references:
+        return "知识库引用：当前没有检索到可用片段。"
+    lines = ["知识库引用："]
+    for index, reference in enumerate(references, start=1):
+        lines.append(
+            f"{index}. 来源={reference.get('source', '未知来源')} 内容={reference.get('content', '')}"
+        )
+    return "\n".join(lines)
+
+
+def _format_tool_calls(tool_calls: list[dict]) -> str:
+    if not tool_calls:
+        return "工具结果：当前场景未声明工具或无需调用工具。"
+    lines = ["工具结果："]
+    for index, tool_call in enumerate(tool_calls, start=1):
+        if tool_call.get("success"):
+            lines.append(
+                f"{index}. 工具={tool_call.get('tool_name')} 结果={json.dumps(tool_call.get('result', {}), ensure_ascii=False)}"
+            )
+        else:
+            lines.append(
+                f"{index}. 工具={tool_call.get('tool_name')} 失败={tool_call.get('error', '未知错误')}"
+            )
+    return "\n".join(lines)