ailine/backend/app/main_graph/nodes/hybrid_router.py

"""
混合路由节点模块 - 前置路由决策
负责决定走快速路径还是 React 循环
"""

import re
import json
from typing import Optional
from dataclasses import dataclass, field
from datetime import datetime
from langchain_core.runnables.config import RunnableConfig

from ..state import MainGraphState
from backend.app.logger import info, debug
from ...model_services.chat_services import get_small_llm_service
from ._utils import dispatch_custom_event
from backend.app.core.json_parser import extract_and_parse_json, safe_get, safe_get_float, safe_get_str


# ========== 核心数据类型 ==========
@dataclass
class HybridRouterResult:
    """Outcome of the hybrid routing step.

    Instances are built either by the keyword rules or from the LLM intent
    classification; the ``path`` field is the value that
    ``route_from_hybrid_decision`` returns as the next node name.
    """
    intent: str = "complex"  # chitchat / knowledge / tool / complex
    confidence: float = 0.0  # rule hits in this module use fixed values (1.0 / 0.9 / 0.3)
    suggested_tools: list = field(default_factory=list)  # subgraph names, e.g. "contact"
    path: str = "react_loop"  # fast_chitchat / fast_rag / fast_tool / react_loop
    reasoning: str = ""  # short human-readable explanation of the decision


# ========== 规则配置 ==========
# Greeting / thanks / farewell phrases that _rule_based_redirect uses to
# detect chitchat. Entries are lower-case because the query is lower-cased
# before matching.
CHITCHAT_KEYWORDS = {
    "你好", "您好", "hi", "hello", "hey", "早上好", "晚上好", "下午好",
    "谢谢", "感谢", "多谢", "thanks", "thank you",
    "再见", "拜拜", "goodbye", "bye"
}

# Subgraph name -> trigger keywords. _rule_based_redirect walks this mapping
# in order and suggests the first subgraph whose keyword occurs in the query.
SUBGRAPH_KEYWORDS = {
    "contact": ["通讯录", "联系人", "contact", "email", "邮件", "邮箱"],
    "dictionary": ["词典", "单词", "翻译", "dictionary", "translate", "生词"],
    "news_analysis": ["资讯", "新闻", "分析", "news", "report", "热点"]
}


# ========== 意图分类 Prompt 模板 ==========
# Prompt template for the LLM intent classifier. It is filled in with
# str.format(query=...), so the literal JSON braces are doubled ({{ }}) and
# {query} is the only placeholder.
# NOTE(review): the "【意图类型（4选一）：" header below has no closing "】",
# unlike the other section headers — confirm whether that is intentional.
INTENT_CLASSIFICATION_PROMPT = """你是一个专业的意图分类助手。请分析用户的查询，并输出 JSON 格式的结果。

【格式要求】
你必须严格输出 JSON 格式，不要加任何 Markdown 代码块标记（如 ```json）。
仅输出纯 JSON 字符串，不要有其他解释文字。

【意图类型（4选一）：
- chitchat: 闲聊、问候、感谢、道别（不需要工具）
- knowledge: 知识查询（需要查询知识库）
- tool: 工具操作（需要调用通讯录/词典/新闻等子图）
- complex: 复杂任务（多步骤、不确定、或需要推理）

【输出格式】
{{
    "intent": "chitchat|knowledge|tool|complex",
    "confidence": 0.85,
    "reasoning": "简要说明理由",
    "suggested_tools": ["contact|dictionary|news_analysis", "other"]
}}

【重要提示】
- 如果不能100%确定意图，请选择 "complex"，置信度设低一些。
- confidence 是你对当前分类的信心（0.0-1.0）。
- suggested_tools 仅在 intent=tool 时提供，否则设为空数组。

【用户查询】
{query}

【现在开始】
请根据以上信息，输出你的分类 JSON："""


# ========== 规则分流（<5ms） ==========
def _rule_based_redirect(query: str) -> Optional[HybridRouterResult]:
    """Route obvious requests with cheap keyword rules, without calling the LLM.

    Rules are tried in order: chitchat keywords, subgraph keywords, then a
    "too short to classify" check.

    Args:
        query: Raw user query; it is stripped and lower-cased before matching.

    Returns:
        A routing decision when one of the rules matches, otherwise ``None``
        so the caller can fall back to LLM classification.
    """
    query_clean = query.strip().lower()

    def _mentions_chitchat(keyword: str) -> bool:
        # ASCII keywords must match as whole words: a plain substring test
        # makes "hi" fire on "this"/"which" and "hey" on "they", which sent
        # ordinary questions down the chitchat path with confidence 1.0.
        # CJK keywords have no word delimiters, so substring matching stays.
        if keyword.isascii():
            pattern = rf"(?<![a-z0-9]){re.escape(keyword)}(?![a-z0-9])"
            return re.search(pattern, query_clean) is not None
        return keyword in query_clean

    # 1. Chitchat
    if any(_mentions_chitchat(kw) for kw in CHITCHAT_KEYWORDS):
        return HybridRouterResult(
            intent="chitchat",
            confidence=1.0,
            path="fast_chitchat",
            reasoning="规则匹配：闲聊类请求"
        )

    # 2. Subgraph keywords (substring match on purpose, so inflected forms
    #    such as "contacts" or "emails" still hit their keyword)
    for subgraph_name, keywords in SUBGRAPH_KEYWORDS.items():
        if any(kw in query_clean for kw in keywords):
            return HybridRouterResult(
                intent="tool",
                confidence=0.9,
                suggested_tools=[subgraph_name],
                path="fast_tool",
                reasoning=f"规则匹配：{subgraph_name} 子图关键词"
            )

    # 3. Very short input: too little signal to classify, use the React loop
    if len(query_clean) < 3 or (query_clean.endswith("?") and len(query_clean) < 5):
        return HybridRouterResult(
            intent="complex",
            confidence=0.3,
            path="react_loop",
            reasoning="规则匹配：问题过于简短"
        )

    return None


# ========== LLM 分类 ==========
async def _classify_with_llm(query: str) -> HybridRouterResult:
    """Classify the query's intent by asking the small LLM service.

    The prompt template is filled with the query, the reply content is run
    through the JSON extractor, and the parsed payload is converted into a
    routing decision. Any exception, or an unsuccessful / empty parse, yields
    the default fallback decision instead of propagating.
    """
    try:
        small_llm = get_small_llm_service()
        reply = await small_llm.ainvoke(
            INTENT_CLASSIFICATION_PROMPT.format(query=query)
        )

        # Pull the JSON object out of the model's reply
        parsed = extract_and_parse_json(reply.content)
        if parsed.success and parsed.data:
            return _parse_classification_result(parsed.data)
        return _default_result()

    except Exception as e:
        # Best-effort step: log at debug level and degrade to the fallback
        debug(f"LLM 分类失败: {e}")
        return _default_result()


def _parse_classification_result(data: dict) -> HybridRouterResult:
    """Convert the parsed classifier JSON into a routing decision.

    The payload comes from an LLM, so it is normalised defensively:

    * ``intent`` is stripped and lower-cased, and anything outside the four
      known labels is treated as "complex" (previously "Tool" or an unknown
      label missed the path map and was stored verbatim in the decision).
    * a confidence below 0.5 forces the "complex" intent.
    * ``suggested_tools`` is coerced to a list.

    Args:
        data: Dictionary extracted from the LLM reply.

    Returns:
        The routing decision; ``path`` is "react_loop" unless the intent is
        one of chitchat / knowledge / tool.
    """
    known_intents = ("chitchat", "knowledge", "tool", "complex")
    # intent -> path mapping; every other intent goes to the React loop
    path_map = {
        "chitchat": "fast_chitchat",
        "knowledge": "fast_rag",
        "tool": "fast_tool",
    }

    intent = safe_get_str(data, "intent", "complex")
    confidence = safe_get_float(data, "confidence", 0.3)
    suggested_tools = safe_get(data, "suggested_tools", [])
    reasoning = safe_get_str(data, "reasoning", "")

    # Normalise the label so case/whitespace variations still map to a path
    intent = intent.strip().lower() if isinstance(intent, str) else "complex"

    # Unknown label or low confidence: fall back to the complex intent
    if intent not in known_intents or confidence < 0.5:
        intent = "complex"

    # The model may return a bare string or null instead of an array
    if isinstance(suggested_tools, str):
        suggested_tools = [suggested_tools]
    elif not isinstance(suggested_tools, list):
        suggested_tools = []

    return HybridRouterResult(
        intent=intent,
        confidence=confidence,
        suggested_tools=suggested_tools,
        path=path_map.get(intent, "react_loop"),
        reasoning=reasoning
    )


def _default_result() -> HybridRouterResult:
    """Build the fallback decision used when LLM classification yields nothing.

    The fallback is a low-confidence "complex" intent routed to the React loop.
    """
    fallback = HybridRouterResult(
        path="react_loop",
        intent="complex",
        reasoning="LLM 调用失败，降级到 React 循环",
        confidence=0.3,
    )
    return fallback


# ========== 主路由节点 ==========
async def hybrid_router_node(state: MainGraphState, config: Optional[RunnableConfig] = None) -> MainGraphState:
    """Graph node that picks between a fast path and the React loop.

    The keyword rules are tried first; only when they return nothing is the
    LLM classifier called. The decision is stored on ``state.hybrid_router``
    and announced through two custom events ("intent_classified" and
    "path_decision").

    Args:
        state: Graph state; ``user_query`` is read, while ``current_phase``
            and ``hybrid_router`` are updated in place.
        config: Runnable config forwarded to the event dispatcher.

    Returns:
        The same ``state`` object after it has been updated.
    """
    state.current_phase = "hybrid_router"
    query = state.user_query or ""

    info(f"[Hybrid Router] 开始路由: {query[:50]}...")

    # Step 1: cheap rule-based routing; step 2: LLM classification on a miss
    decision = _rule_based_redirect(query)
    if not decision:
        info("[Hybrid Router] 规则未命中，使用 LLM 分类")
        decision = await _classify_with_llm(query)
    else:
        info(f"[Hybrid Router] 规则命中: {decision.path}")

    # Step 3: record the decision in the structured state fields
    router_state = state.hybrid_router
    router_state.decision = decision
    # NOTE(review): start_time is stamped after routing has already finished —
    # confirm that this is the intended meaning of the field.
    router_state.start_time = datetime.now().isoformat()

    # Step 4: emit the events
    intent_payload = {
        "intent": decision.intent,
        "confidence": decision.confidence,
        "reasoning": decision.reasoning,
        "suggested_tools": decision.suggested_tools
    }
    await dispatch_custom_event("intent_classified", intent_payload, config)

    path_payload = {
        "path": decision.path,
        "intent": decision.intent,
        "reasoning": decision.reasoning
    }
    await dispatch_custom_event("path_decision", path_payload, config)

    info(f"[Hybrid Router] 路由决策: {decision.path} (intent={decision.intent}, confidence={decision.confidence})")
    return state


# ========== 条件路由函数 ==========
def route_from_hybrid_decision(state: MainGraphState) -> str:
    """Return the next node name recorded by the hybrid router.

    Reads ``state.hybrid_router.decision`` and returns its ``path``; when the
    decision is missing/falsy or has no ``path`` attribute, "react_loop" is
    returned instead.
    """
    decision = state.hybrid_router.decision
    # Guard clause: no usable decision means the React loop
    if not decision or not hasattr(decision, "path"):
        return "react_loop"
    return decision.path


def check_fast_path_success(state: MainGraphState) -> str:
    """Choose the edge to follow after a fast-path node has run.

    Returns "escalate" when ``state.fast_path.failed`` is truthy, otherwise
    "llm_call". The outcome is logged in both cases.
    """
    if not state.fast_path.failed:
        info("[Fast Path Check] 快速路径成功，进入 llm_call")
        return "llm_call"

    info("[Fast Path Check] 快速路径失败，升级到 React 循环")
    return "escalate"


# ========== 导出 ==========
# Names exported by `from ... import *`; the underscore-prefixed helpers in
# this module are intentionally left out.
__all__ = [
    "hybrid_router_node",
    "route_from_hybrid_decision",
    "check_fast_path_success",
    "HybridRouterResult",
]
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
+								"""
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								混合路由节点模块 - 前置路由决策
 								负责决定走快速路径还是 React 循环
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
+								"""
 								import re
 								import json
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								from typing import Optional
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
+								from dataclasses import dataclass, field
 								from datetime import datetime
-												导入方式修改

											
										
										
											2026-05-05 23:17:00 +08:00
+								from langchain_core.runnables.config import RunnableConfig
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
-												fix: 修复 RAG 无限循环问题和导入错误

主要修复：
1. 修复 RAG 推理无限循环问题（大小写不匹配 + 缺少已检索结果检查）
2. 修复 intent_classifier.py 的绝对导入错误
3. 删除旧的 start.sh 脚本，添加新的启动脚本
4. 优化路由逻辑和状态管理

											
										
										
											2026-05-04 18:59:15 +08:00
+								from ..state import MainGraphState
-												添加rag置信度判断

											
										
										
											2026-05-06 01:15:52 +08:00
+								from backend.app.logger import info, debug
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								from ...model_services.chat_services import get_small_llm_service
 								from ._utils import dispatch_custom_event
-												重构：增强 JSON 解析稳定性，优化 Prompt，改进状态结构

主要改进：

1. 新增 json_parser.py - 统一的 JSON 解析工具
   - 支持多种格式（纯 JSON、markdown、文本中的 JSON）
   - 多层 fallback 策略
   - 安全的字段提取函数

2. 优化 intent.py 和 hybrid_router.py
   - 使用新的 json_parser
   - 优化 Prompt，更清晰的格式要求
   - 更好的错误处理

3. 改进 state.py - 新增结构化状态字段
   - ReactReasoningState、HybridRouterState、FastPathState
   - 向后兼容旧的 debug_info

4. 更新各节点模块 - 同时更新旧字段保持兼容
   - reasoning.py - 更新 state.react_reasoning
   - hybrid_router.py - 更新 state.hybrid_router
   - fast_paths.py - 更新 state.fast_path

											
										
										
											2026-05-06 13:34:32 +08:00
+								from backend.app.core.json_parser import extract_and_parse_json, safe_get, safe_get_float, safe_get_str
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
 								# ========== 核心数据类型 ==========
 								@dataclass
 								class HybridRouterResult:
 								    """混合路由结果"""
 								    intent: str = "complex"  # chitchat / knowledge / tool / complex
 								    confidence: float = 0.0
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								    suggested_tools: list = field(default_factory=list)
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
+								    path: str = "react_loop"  # fast_chitchat / fast_rag / fast_tool / react_loop
 								    reasoning: str = ""
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								# ========== 规则配置 ==========
 								CHITCHAT_KEYWORDS = {
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
+								    "你好", "您好", "hi", "hello", "hey", "早上好", "晚上好", "下午好",
 								    "谢谢", "感谢", "多谢", "thanks", "thank you",
 								    "再见", "拜拜", "goodbye", "bye"
 								}
 								SUBGRAPH_KEYWORDS = {
 								    "contact": ["通讯录", "联系人", "contact", "email", "邮件", "邮箱"],
 								    "dictionary": ["词典", "单词", "翻译", "dictionary", "translate", "生词"],
 								    "news_analysis": ["资讯", "新闻", "分析", "news", "report", "热点"]
 								}
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
 								# ========== 意图分类 Prompt 模板 ==========
 								INTENT_CLASSIFICATION_PROMPT = """你是一个专业的意图分类助手。请分析用户的查询，并输出 JSON 格式的结果。
-												重构：增强 JSON 解析稳定性，优化 Prompt，改进状态结构

主要改进：

1. 新增 json_parser.py - 统一的 JSON 解析工具
   - 支持多种格式（纯 JSON、markdown、文本中的 JSON）
   - 多层 fallback 策略
   - 安全的字段提取函数

2. 优化 intent.py 和 hybrid_router.py
   - 使用新的 json_parser
   - 优化 Prompt，更清晰的格式要求
   - 更好的错误处理

3. 改进 state.py - 新增结构化状态字段
   - ReactReasoningState、HybridRouterState、FastPathState
   - 向后兼容旧的 debug_info

4. 更新各节点模块 - 同时更新旧字段保持兼容
   - reasoning.py - 更新 state.react_reasoning
   - hybrid_router.py - 更新 state.hybrid_router
   - fast_paths.py - 更新 state.fast_path

											
										
										
											2026-05-06 13:34:32 +08:00
+								【格式要求】
 								你必须严格输出 JSON 格式，不要加任何 Markdown 代码块标记（如 ```json）。
 								仅输出纯 JSON 字符串，不要有其他解释文字。
 								【意图类型（4选一）：
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								- chitchat: 闲聊、问候、感谢、道别（不需要工具）
 								- knowledge: 知识查询（需要查询知识库）
 								- tool: 工具操作（需要调用通讯录/词典/新闻等子图）
 								- complex: 复杂任务（多步骤、不确定、或需要推理）
-												重构：增强 JSON 解析稳定性，优化 Prompt，改进状态结构

主要改进：

1. 新增 json_parser.py - 统一的 JSON 解析工具
   - 支持多种格式（纯 JSON、markdown、文本中的 JSON）
   - 多层 fallback 策略
   - 安全的字段提取函数

2. 优化 intent.py 和 hybrid_router.py
   - 使用新的 json_parser
   - 优化 Prompt，更清晰的格式要求
   - 更好的错误处理

3. 改进 state.py - 新增结构化状态字段
   - ReactReasoningState、HybridRouterState、FastPathState
   - 向后兼容旧的 debug_info

4. 更新各节点模块 - 同时更新旧字段保持兼容
   - reasoning.py - 更新 state.react_reasoning
   - hybrid_router.py - 更新 state.hybrid_router
   - fast_paths.py - 更新 state.fast_path

											
										
										
											2026-05-06 13:34:32 +08:00
+								【输出格式】
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								{{
 								    "intent": "chitchat|knowledge|tool|complex",
-												重构：增强 JSON 解析稳定性，优化 Prompt，改进状态结构

主要改进：

1. 新增 json_parser.py - 统一的 JSON 解析工具
   - 支持多种格式（纯 JSON、markdown、文本中的 JSON）
   - 多层 fallback 策略
   - 安全的字段提取函数

2. 优化 intent.py 和 hybrid_router.py
   - 使用新的 json_parser
   - 优化 Prompt，更清晰的格式要求
   - 更好的错误处理

3. 改进 state.py - 新增结构化状态字段
   - ReactReasoningState、HybridRouterState、FastPathState
   - 向后兼容旧的 debug_info

4. 更新各节点模块 - 同时更新旧字段保持兼容
   - reasoning.py - 更新 state.react_reasoning
   - hybrid_router.py - 更新 state.hybrid_router
   - fast_paths.py - 更新 state.fast_path

											
										
										
											2026-05-06 13:34:32 +08:00
+								    "confidence": 0.85,
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								    "reasoning": "简要说明理由",
 								    "suggested_tools": ["contact|dictionary|news_analysis", "other"]
 								}}
-												重构：增强 JSON 解析稳定性，优化 Prompt，改进状态结构

主要改进：

1. 新增 json_parser.py - 统一的 JSON 解析工具
   - 支持多种格式（纯 JSON、markdown、文本中的 JSON）
   - 多层 fallback 策略
   - 安全的字段提取函数

2. 优化 intent.py 和 hybrid_router.py
   - 使用新的 json_parser
   - 优化 Prompt，更清晰的格式要求
   - 更好的错误处理

3. 改进 state.py - 新增结构化状态字段
   - ReactReasoningState、HybridRouterState、FastPathState
   - 向后兼容旧的 debug_info

4. 更新各节点模块 - 同时更新旧字段保持兼容
   - reasoning.py - 更新 state.react_reasoning
   - hybrid_router.py - 更新 state.hybrid_router
   - fast_paths.py - 更新 state.fast_path

											
										
										
											2026-05-06 13:34:32 +08:00
+								【重要提示】
 								- 如果不能100%确定意图，请选择 "complex"，置信度设低一些。
 								- confidence 是你对当前分类的信心（0.0-1.0）。
 								- suggested_tools 仅在 intent=tool 时提供，否则设为空数组。
 								【用户查询】
 								{query}
 								【现在开始】
 								请根据以上信息，输出你的分类 JSON："""
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
 								# ========== 规则分流（<5ms） ==========
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
+								def _rule_based_redirect(query: str) -> Optional[HybridRouterResult]:
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								    """规则分流：处理明显不需要推理的情况"""
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
+								    query_clean = query.strip().lower()
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
 								    # 1. 闲聊
 								    if query_clean in CHITCHAT_KEYWORDS or any(kw in query_clean for kw in CHITCHAT_KEYWORDS):
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
+								        return HybridRouterResult(
 								            intent="chitchat",
 								            confidence=1.0,
 								            path="fast_chitchat",
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								            reasoning="规则匹配：闲聊类请求"
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
+								        )
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
 								    # 2. 子图关键词
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
+								    for subgraph_name, keywords in SUBGRAPH_KEYWORDS.items():
 								        if any(kw in query_clean for kw in keywords):
 								            return HybridRouterResult(
 								                intent="tool",
 								                confidence=0.9,
 								                suggested_tools=[subgraph_name],
 								                path="fast_tool",
 								                reasoning=f"规则匹配：{subgraph_name} 子图关键词"
 								            )
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
 								    # 3. 短问题
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
+								    if len(query_clean) < 3 or (query_clean.endswith("?") and len(query_clean) < 5):
 								        return HybridRouterResult(
 								            intent="complex",
 								            confidence=0.3,
 								            path="react_loop",
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								            reasoning="规则匹配：问题过于简短"
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
+								        )
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								    return None
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								# ========== LLM 分类 ==========
 								async def _classify_with_llm(query: str) -> HybridRouterResult:
 								    """使用轻量级 LLM 进行意图分类"""
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
+								    try:
 								        llm = get_small_llm_service()
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								        prompt = INTENT_CLASSIFICATION_PROMPT.format(query=query)
 								        response = await llm.ainvoke(prompt)
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
-												重构：增强 JSON 解析稳定性，优化 Prompt，改进状态结构

主要改进：

1. 新增 json_parser.py - 统一的 JSON 解析工具
   - 支持多种格式（纯 JSON、markdown、文本中的 JSON）
   - 多层 fallback 策略
   - 安全的字段提取函数

2. 优化 intent.py 和 hybrid_router.py
   - 使用新的 json_parser
   - 优化 Prompt，更清晰的格式要求
   - 更好的错误处理

3. 改进 state.py - 新增结构化状态字段
   - ReactReasoningState、HybridRouterState、FastPathState
   - 向后兼容旧的 debug_info

4. 更新各节点模块 - 同时更新旧字段保持兼容
   - reasoning.py - 更新 state.react_reasoning
   - hybrid_router.py - 更新 state.hybrid_router
   - fast_paths.py - 更新 state.fast_path

											
										
										
											2026-05-06 13:34:32 +08:00
+								        # 使用新的 JSON 解析器
 								        parse_result = extract_and_parse_json(response.content)
 								        if not parse_result.success or not parse_result.data:
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								            return _default_result()
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
-												重构：增强 JSON 解析稳定性，优化 Prompt，改进状态结构

主要改进：

1. 新增 json_parser.py - 统一的 JSON 解析工具
   - 支持多种格式（纯 JSON、markdown、文本中的 JSON）
   - 多层 fallback 策略
   - 安全的字段提取函数

2. 优化 intent.py 和 hybrid_router.py
   - 使用新的 json_parser
   - 优化 Prompt，更清晰的格式要求
   - 更好的错误处理

3. 改进 state.py - 新增结构化状态字段
   - ReactReasoningState、HybridRouterState、FastPathState
   - 向后兼容旧的 debug_info

4. 更新各节点模块 - 同时更新旧字段保持兼容
   - reasoning.py - 更新 state.react_reasoning
   - hybrid_router.py - 更新 state.hybrid_router
   - fast_paths.py - 更新 state.fast_path

											
										
										
											2026-05-06 13:34:32 +08:00
+								        return _parse_classification_result(parse_result.data)
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
 								    except Exception as e:
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								        debug(f"LLM 分类失败: {e}")
 								        return _default_result()
 								def _parse_classification_result(data: dict) -> HybridRouterResult:
 								    """解析分类结果"""
-												重构：增强 JSON 解析稳定性，优化 Prompt，改进状态结构

主要改进：

1. 新增 json_parser.py - 统一的 JSON 解析工具
   - 支持多种格式（纯 JSON、markdown、文本中的 JSON）
   - 多层 fallback 策略
   - 安全的字段提取函数

2. 优化 intent.py 和 hybrid_router.py
   - 使用新的 json_parser
   - 优化 Prompt，更清晰的格式要求
   - 更好的错误处理

3. 改进 state.py - 新增结构化状态字段
   - ReactReasoningState、HybridRouterState、FastPathState
   - 向后兼容旧的 debug_info

4. 更新各节点模块 - 同时更新旧字段保持兼容
   - reasoning.py - 更新 state.react_reasoning
   - hybrid_router.py - 更新 state.hybrid_router
   - fast_paths.py - 更新 state.fast_path

											
										
										
											2026-05-06 13:34:32 +08:00
+								    intent = safe_get_str(data, "intent", "complex")
 								    confidence = safe_get_float(data, "confidence", 0.3)
 								    suggested_tools = safe_get(data, "suggested_tools", [])
 								    reasoning = safe_get_str(data, "reasoning", "")
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
 								    # 置信度低于阈值，走 complex
 								    if confidence < 0.5:
 								        intent = "complex"
 								    # intent -> path 映射
 								    path_map = {
 								        "chitchat": "fast_chitchat",
 								        "knowledge": "fast_rag",
 								        "tool": "fast_tool",
 								    }
 								    return HybridRouterResult(
 								        intent=intent,
 								        confidence=confidence,
-												重构：增强 JSON 解析稳定性，优化 Prompt，改进状态结构

主要改进：

1. 新增 json_parser.py - 统一的 JSON 解析工具
   - 支持多种格式（纯 JSON、markdown、文本中的 JSON）
   - 多层 fallback 策略
   - 安全的字段提取函数

2. 优化 intent.py 和 hybrid_router.py
   - 使用新的 json_parser
   - 优化 Prompt，更清晰的格式要求
   - 更好的错误处理

3. 改进 state.py - 新增结构化状态字段
   - ReactReasoningState、HybridRouterState、FastPathState
   - 向后兼容旧的 debug_info

4. 更新各节点模块 - 同时更新旧字段保持兼容
   - reasoning.py - 更新 state.react_reasoning
   - hybrid_router.py - 更新 state.hybrid_router
   - fast_paths.py - 更新 state.fast_path

											
										
										
											2026-05-06 13:34:32 +08:00
+								        suggested_tools=suggested_tools,
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								        path=path_map.get(intent, "react_loop"),
-												重构：增强 JSON 解析稳定性，优化 Prompt，改进状态结构

主要改进：

1. 新增 json_parser.py - 统一的 JSON 解析工具
   - 支持多种格式（纯 JSON、markdown、文本中的 JSON）
   - 多层 fallback 策略
   - 安全的字段提取函数

2. 优化 intent.py 和 hybrid_router.py
   - 使用新的 json_parser
   - 优化 Prompt，更清晰的格式要求
   - 更好的错误处理

3. 改进 state.py - 新增结构化状态字段
   - ReactReasoningState、HybridRouterState、FastPathState
   - 向后兼容旧的 debug_info

4. 更新各节点模块 - 同时更新旧字段保持兼容
   - reasoning.py - 更新 state.react_reasoning
   - hybrid_router.py - 更新 state.hybrid_router
   - fast_paths.py - 更新 state.fast_path

											
										
										
											2026-05-06 13:34:32 +08:00
+								        reasoning=reasoning
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								    )
 								def _default_result() -> HybridRouterResult:
 								    """默认结果（LLM 失败时）"""
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
+								    return HybridRouterResult(
 								        intent="complex",
 								        confidence=0.3,
 								        path="react_loop",
 								        reasoning="LLM 调用失败，降级到 React 循环"
 								    )
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								# ========== 主路由节点 ==========
-												导入方式修改

											
										
										
											2026-05-05 23:17:00 +08:00
async def hybrid_router_node(
    state: MainGraphState, config: Optional[RunnableConfig] = None
) -> MainGraphState:
    """Front router node: choose between a fast path and the React loop.

    Tries the rule-based redirect first and falls back to LLM classification
    when no rule matches. The decision is stored on ``state.hybrid_router``
    and announced through the ``intent_classified`` and ``path_decision``
    custom events.

    Args:
        state: Graph state; ``user_query`` is read, ``current_phase`` and
            ``hybrid_router`` are updated in place.
        config: Runnable config forwarded to ``dispatch_custom_event``.

    Returns:
        The same ``state`` object, updated with the routing decision.
    """
    # Stamp the start before any classification work; previously this was
    # taken after the LLM call and therefore recorded the end of routing.
    started_at = datetime.now().isoformat()

    state.current_phase = "hybrid_router"
    query = state.user_query or ""

    info(f"[Hybrid Router] 开始路由: {query[:50]}...")

    # 1. Rule-based redirect (no LLM involved).
    decision = _rule_based_redirect(query)
    if decision:
        info(f"[Hybrid Router] 规则命中: {decision.path}")
    elif not query.strip():
        # Nothing to classify: skip the LLM round-trip and use the dataclass
        # defaults (intent "complex", path "react_loop").
        info("[Hybrid Router] 空查询，跳过 LLM 分类")
        decision = HybridRouterResult(reasoning="空查询，直接进入 React 循环")
    else:
        # 2. LLM classification.
        info("[Hybrid Router] 规则未命中，使用 LLM 分类")
        decision = await _classify_with_llm(query)

    # 3. Update state using the structured fields only.
    state.hybrid_router.decision = decision
    state.hybrid_router.start_time = started_at

    # 4. Emit events.
    await dispatch_custom_event("intent_classified", {
        "intent": decision.intent,
        "confidence": decision.confidence,
        "reasoning": decision.reasoning,
        "suggested_tools": decision.suggested_tools
    }, config)

    await dispatch_custom_event("path_decision", {
        "path": decision.path,
        "intent": decision.intent,
        "reasoning": decision.reasoning
    }, config)

    info(f"[Hybrid Router] 路由决策: {decision.path} (intent={decision.intent}, confidence={decision.confidence})")

    return state
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								# ========== 条件路由函数 ==========
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
def route_from_hybrid_decision(state: "MainGraphState") -> str:
    """Return the next node name from the stored hybrid-router decision.

    Args:
        state: Graph state; only ``state.hybrid_router.decision`` is read.

    Returns:
        ``decision.path`` when it is a non-empty string, otherwise
        ``"react_loop"``.
    """
    decision = state.hybrid_router.decision
    # getattr covers both a missing decision (None) and an object without a
    # ``path`` attribute.
    path = getattr(decision, "path", None)
    # A None or empty path is not a usable route key; fall back instead of
    # returning it.
    if isinstance(path, str) and path:
        return path
    return "react_loop"
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
 								def check_fast_path_success(state: MainGraphState) -> str:
-												重构：继续移除对 debug_info 的依赖，主要模块已完成迁移

											
										
										
											2026-05-06 14:47:51 +08:00
+								    """检查快速路径是否成功 - 使用新的结构化字段"""
 								    if state.fast_path.failed:
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								        info("[Fast Path Check] 快速路径失败，升级到 React 循环")
-												✨ 完整的混合路由优化系统

1. 双模型服务 (llm + smallLLM)
   - 增加 get_small_llm_service() 函数
   - 支持智谱/DeepSeek 小模型作为轻量级选项

2. 前置混合路由
   - 规则快速分流（无 LLM，超快速）
   - 轻量级意图分类（smallLLM）
   - 快速路径：fast_chitchat, fast_rag, fast_tool

3. 自动升级机制
   - 快速路径失败 → 自动回到 React 循环
   - SSE 事件增强：intent_classified, path_decision, fast_path_*, escalation

4. 向后兼容
   - build_react_main_graph(use_hybrid_router=True/False)
   - 可选择启用或禁用混合路由

5. 更新 intent.py
   - 支持 use_small_llm 参数
   - 保留原有完整功能供 React 循环使用

											
										
										
											2026-05-03 16:45:46 +08:00
+								        return "escalate"
-												重构：继续移除对 debug_info 的依赖，主要模块已完成迁移

											
										
										
											2026-05-06 14:47:51 +08:00
-												refactor: 重构快速路径流程，统一通过 llm_call 输出

- 重构 fast_paths.py，让 fast_chitchat 和 fast_rag 都进入 llm_call 而不是直接设置 final_result
- 修改 check_fast_path_success 函数返回 'llm_call' 而不是 'success'
- 更新 main_graph_builder.py 的条件边配置，支持路由到 llm_call
- 在快速路径节点中添加清除 state.final_result 的逻辑，避免复用旧结果
- 重构 RAG 工具初始化方式，使用模块级变量管理
- 修改 finalize.py 让它返回 final_result
- 更新 agent_service.py 的 RAG 工具注入方式
- 简化 hybrid_router.py 的代码结构
- 清理 rag_nodes.py 的全局变量相关代码
- 更新相关测试文件

											
										
										
											2026-05-05 04:32:42 +08:00
+								    info("[Fast Path Check] 快速路径成功，进入 llm_call")
 								    return "llm_call"
 								# ========== 导出 ==========
 								__all__ = [
 								    "hybrid_router_node",
 								    "route_from_hybrid_decision",
 								    "check_fast_path_success",
 								    "HybridRouterResult",
 								]