"""
FastAPI backend - supports dynamic model switching with PostgreSQL-backed persistent memory.
Uses a dependency-injection pattern to manage resource lifecycles cleanly.
"""
import os
import uuid
import json
from contextlib import asynccontextmanager

from dotenv import load_dotenv
from fastapi import FastAPI, HTTPException, WebSocket, WebSocketDisconnect, Depends, Request, Query
from fastapi.middleware.cors import CORSMiddleware
from fastapi.responses import StreamingResponse
from pydantic import BaseModel
from langgraph.checkpoint.postgres.aio import AsyncPostgresSaver

from app.agent import AIAgentService
from app.history import ThreadHistoryService
from app.logger import debug, info, warning, error

# Load environment variables from the .env file
load_dotenv()

# PostgreSQL connection string
# Priority: the DB_URI environment variable, falling back to the Docker-internal service hostname
DB_URI = os.getenv(
    "DB_URI",
    "postgresql://postgres:mysecretpassword@ai-postgres:5432/langgraph_db?sslmode=disable"
)
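
# For local development, DB_URI would typically be overridden to point at a local Postgres
# instance, e.g. (illustrative values only, matching the default credentials above):
#   export DB_URI="postgresql://postgres:mysecretpassword@localhost:5432/langgraph_db?sslmode=disable"
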
@asynccontextmanager
async def lifespan(app: FastAPI):
"""应用生命周期管理:创建并注入全局服务"""
# 1. 创建数据库连接池并初始化表(仅 checkpointer
async with AsyncPostgresSaver.from_conn_string(DB_URI) as checkpointer:
2026-04-13 19:49:18 +08:00
await checkpointer.setup()
# 2. 构建 AI Agent 服务
agent_service = AIAgentService(checkpointer)
2026-04-13 19:49:18 +08:00
await agent_service.initialize()
2026-04-16 03:21:38 +08:00
# 3. 创建历史查询服务
history_service = ThreadHistoryService(checkpointer)
# 4. 将服务实例存入 app.state
2026-04-13 19:49:18 +08:00
app.state.agent_service = agent_service
2026-04-16 03:21:38 +08:00
app.state.history_service = history_service
2026-04-13 19:49:18 +08:00
# 应用运行中...
yield
2026-04-16 03:21:38 +08:00
# 5. 关闭时自动清理数据库连接async with 负责)
2026-04-14 17:34:12 +08:00
info("🛑 应用关闭,数据库连接池已释放")
2026-04-13 19:49:18 +08:00
app = FastAPI(lifespan=lifespan)
# CORS middleware (allow cross-origin requests from the frontend)
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)


# ========== Health check endpoint ==========
@app.get("/health")
async def health_check():
    """Health check endpoint used by Docker and CI/CD monitoring."""
    return {"status": "ok", "service": "ai-agent-backend"}


# ========== Pydantic models ==========
class ChatRequest(BaseModel):
    message: str
    thread_id: str | None = None
    model: str = "zhipu"
    user_id: str = "default_user"


class ChatResponse(BaseModel):
    reply: str
    thread_id: str
    model_used: str
    input_tokens: int = 0
    output_tokens: int = 0
    total_tokens: int = 0
    elapsed_time: float = 0.0
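
# Illustrative JSON shapes for the models above (example values only):
#   ChatRequest:  {"message": "Hello", "thread_id": null, "model": "zhipu", "user_id": "default_user"}
#   ChatResponse: {"reply": "...", "thread_id": "<uuid>", "model_used": "zhipu",
#                  "input_tokens": 12, "output_tokens": 34, "total_tokens": 46, "elapsed_time": 1.2}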


# ========== Dependency injection functions ==========
def get_agent_service(request: Request) -> AIAgentService:
    """Fetch the global AIAgentService instance from app.state."""
    return request.app.state.agent_service


def get_history_service(request: Request) -> ThreadHistoryService:
    """Fetch the global ThreadHistoryService instance from app.state."""
    return request.app.state.history_service


# ========== HTTP endpoints ==========
@app.post("/chat", response_model=ChatResponse)
async def chat_endpoint(
    request: ChatRequest,
    agent_service: AIAgentService = Depends(get_agent_service)
):
    """Synchronous chat endpoint with model selection."""
    if not request.message:
        raise HTTPException(status_code=400, detail="message required")

    thread_id = request.thread_id or str(uuid.uuid4())
    result = await agent_service.process_message(
        request.message, thread_id, request.model, request.user_id
    )

    # Extract token usage statistics
    token_usage = result.get("token_usage", {})
    input_tokens = token_usage.get('prompt_tokens', token_usage.get('input_tokens', 0))
    output_tokens = token_usage.get('completion_tokens', token_usage.get('output_tokens', 0))
    elapsed_time = result.get("elapsed_time", 0.0)

    # Fall back to the first registered model if the requested one is unavailable
    actual_model = request.model if request.model in agent_service.graphs else next(iter(agent_service.graphs.keys()))

    return ChatResponse(
        reply=result["reply"],
        thread_id=thread_id,
        model_used=actual_model,
        input_tokens=input_tokens,
        output_tokens=output_tokens,
        total_tokens=input_tokens + output_tokens,
        elapsed_time=elapsed_time
    )
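
# Illustrative request (assumes the default port 8083 configured at the bottom of this file):
#   curl -X POST http://localhost:8083/chat \
#        -H "Content-Type: application/json" \
#        -d '{"message": "Hello", "model": "zhipu"}'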


# ========== History query endpoints ==========
@app.get("/threads")
async def list_threads(
    user_id: str = Query("default_user", description="User ID"),
    limit: int = Query(50, ge=1, le=200, description="Maximum number of threads to return"),
    history_service: ThreadHistoryService = Depends(get_history_service)
):
    """Return the list of conversation threads for the current user."""
    threads = await history_service.get_user_threads(user_id, limit)
    return {"threads": threads}


@app.get("/thread/{thread_id}/messages")
async def get_thread_messages(
    thread_id: str,
    user_id: str = Query("default_user", description="User ID"),
    history_service: ThreadHistoryService = Depends(get_history_service)
):
    """Return the full message history for the given thread."""
    messages = await history_service.get_thread_messages(thread_id)
    return {"messages": messages}


@app.get("/thread/{thread_id}/summary")
async def get_thread_summary(
    thread_id: str,
    user_id: str = Query("default_user", description="User ID"),
    history_service: ThreadHistoryService = Depends(get_history_service)
):
    """Return summary information for the given thread."""
    summary = await history_service.get_thread_summary(thread_id)
    return summary
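
# Illustrative queries (example values; <thread_id> is a placeholder):
#   curl "http://localhost:8083/threads?user_id=default_user&limit=20"
#   curl "http://localhost:8083/thread/<thread_id>/messages"
#   curl "http://localhost:8083/thread/<thread_id>/summary"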


# ========== Streaming chat endpoint ==========
@app.post("/chat/stream")
async def chat_stream_endpoint(
    request: ChatRequest,
    agent_service: AIAgentService = Depends(get_agent_service)
):
    """Streaming chat endpoint (SSE)."""
    if not request.message:
        raise HTTPException(status_code=400, detail="message required")

    thread_id = request.thread_id or str(uuid.uuid4())

    async def event_generator():
        try:
            async for chunk in agent_service.process_message_stream(
                request.message, thread_id, request.model, request.user_id
            ):
                yield f"data: {json.dumps(chunk, ensure_ascii=False)}\n\n"
            yield "data: [DONE]\n\n"
        except Exception as e:
            error(f"Streaming response error: {e}")
            yield f"data: {json.dumps({'type': 'error', 'message': str(e)}, ensure_ascii=False)}\n\n"
            yield "data: [DONE]\n\n"

    return StreamingResponse(
        event_generator(),
        media_type="text/event-stream",
        headers={
            "Cache-Control": "no-cache",
            "Connection": "keep-alive",
            "X-Accel-Buffering": "no",  # Disable Nginx buffering
        }
    )
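
# Each chunk from process_message_stream is serialized as an SSE frame "data: <json>\n\n";
# errors are sent as data: {"type": "error", "message": "..."} and the stream always ends with
# "data: [DONE]". Illustrative client call (assumes the default port 8083):
#   curl -N -X POST http://localhost:8083/chat/stream \
#        -H "Content-Type: application/json" \
#        -d '{"message": "Hello", "model": "zhipu"}'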


# ========== WebSocket endpoint (optional) ==========
@app.websocket("/ws")
async def websocket_endpoint(
    websocket: WebSocket,
    agent_service: AIAgentService = Depends(get_agent_service)
):
    await websocket.accept()
    try:
        while True:
            data = await websocket.receive_json()
            message = data.get("message")
            thread_id = data.get("thread_id", str(uuid.uuid4()))
            model = data.get("model", "zhipu")
            user_id = data.get("user_id", "default_user")

            if not message:
                await websocket.send_json({"error": "missing message"})
                continue

            # process_message returns a result dict; send only the reply text back to the client
            result = await agent_service.process_message(message, thread_id, model, user_id)
            actual_model = model if model in agent_service.graphs else next(iter(agent_service.graphs.keys()))
            await websocket.send_json({"reply": result["reply"], "thread_id": thread_id, "model_used": actual_model})
    except WebSocketDisconnect:
        pass
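
# Expected client message over the WebSocket (illustrative values; only "message" is required):
#   {"message": "Hello", "thread_id": "<uuid>", "model": "zhipu", "user_id": "default_user"}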


if __name__ == "__main__":
    import uvicorn

    # Use BACKEND_PORT from the environment, defaulting to 8083 (avoids conflicting with llama.cpp on port 8081)
    port = int(os.getenv("BACKEND_PORT", "8083"))
    uvicorn.run(app, host="0.0.0.0", port=port)