2025-10-30 11:14:43 +08:00
|
|
|
|
"""AI服务封装 - 统一的OpenAI和Claude接口"""
|
|
|
|
|
|
from typing import Optional, AsyncGenerator, List, Dict, Any
|
|
|
|
|
|
from openai import AsyncOpenAI
|
|
|
|
|
|
from anthropic import AsyncAnthropic
|
2025-10-30 16:53:50 +08:00
|
|
|
|
from app.config import settings as app_settings
|
2025-10-30 11:14:43 +08:00
|
|
|
|
from app.logger import get_logger
|
2025-11-24 11:30:27 +08:00
|
|
|
|
from app.mcp.adapters import UniversalMCPAdapter, PromptInjectionAdapter
|
2025-10-30 11:14:43 +08:00
|
|
|
|
import httpx
|
2025-11-07 22:14:20 +08:00
|
|
|
|
import json
|
2025-11-22 18:23:30 +08:00
|
|
|
|
import hashlib
|
2025-12-14 15:21:52 +08:00
|
|
|
|
import re
|
|
|
|
|
|
import asyncio
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
|
|
|
|
|
logger = get_logger(__name__)
|
|
|
|
|
|
|
2025-12-14 15:21:52 +08:00
|
|
|
|
# 全局请求限流器(使用信号量控制并发数)
|
|
|
|
|
|
_global_semaphore = asyncio.Semaphore(5) # 最多5个并发请求
|
|
|
|
|
|
_request_delay = 0.2 # 请求间隔200ms
|
|
|
|
|
|
|
2025-11-22 18:23:30 +08:00
|
|
|
|
# 全局HTTP客户端池(按配置复用)
|
|
|
|
|
|
_http_client_pool: Dict[str, httpx.AsyncClient] = {}
|
|
|
|
|
|
_client_pool_lock = False # 简单的锁标志
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def _get_client_key(provider: str, base_url: Optional[str], api_key: str) -> str:
|
|
|
|
|
|
"""生成HTTP客户端的唯一键
|
|
|
|
|
|
|
|
|
|
|
|
Args:
|
|
|
|
|
|
provider: 提供商名称
|
|
|
|
|
|
base_url: API基础URL
|
|
|
|
|
|
api_key: API密钥(用于区分不同用户)
|
|
|
|
|
|
|
|
|
|
|
|
Returns:
|
|
|
|
|
|
客户端唯一键
|
|
|
|
|
|
"""
|
|
|
|
|
|
# 使用API密钥的哈希值(安全性)+ 提供商 + base_url 作为键
|
|
|
|
|
|
key_hash = hashlib.md5(api_key.encode()).hexdigest()[:8]
|
|
|
|
|
|
url_part = base_url or "default"
|
|
|
|
|
|
return f"{provider}_{url_part}_{key_hash}"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def _get_or_create_http_client(
|
|
|
|
|
|
provider: str,
|
|
|
|
|
|
base_url: Optional[str],
|
|
|
|
|
|
api_key: str
|
|
|
|
|
|
) -> httpx.AsyncClient:
|
|
|
|
|
|
"""获取或创建HTTP客户端(复用连接)
|
|
|
|
|
|
|
|
|
|
|
|
Args:
|
|
|
|
|
|
provider: 提供商名称
|
|
|
|
|
|
base_url: API基础URL
|
|
|
|
|
|
api_key: API密钥
|
|
|
|
|
|
|
|
|
|
|
|
Returns:
|
|
|
|
|
|
httpx.AsyncClient实例
|
|
|
|
|
|
"""
|
|
|
|
|
|
global _http_client_pool
|
|
|
|
|
|
|
|
|
|
|
|
client_key = _get_client_key(provider, base_url, api_key)
|
|
|
|
|
|
|
|
|
|
|
|
# 检查是否已存在
|
|
|
|
|
|
if client_key in _http_client_pool:
|
|
|
|
|
|
client = _http_client_pool[client_key]
|
|
|
|
|
|
# 检查客户端是否仍然有效
|
|
|
|
|
|
if not client.is_closed:
|
|
|
|
|
|
logger.debug(f"♻️ 复用HTTP客户端: {client_key}")
|
|
|
|
|
|
return client
|
|
|
|
|
|
else:
|
|
|
|
|
|
# 客户端已关闭,从池中移除
|
|
|
|
|
|
logger.warning(f"⚠️ HTTP客户端已关闭,重新创建: {client_key}")
|
|
|
|
|
|
del _http_client_pool[client_key]
|
|
|
|
|
|
|
|
|
|
|
|
# 创建新客户端
|
|
|
|
|
|
limits = httpx.Limits(
|
|
|
|
|
|
max_keepalive_connections=50, # 最大保持连接数
|
|
|
|
|
|
max_connections=100, # 最大总连接数
|
|
|
|
|
|
keepalive_expiry=30.0 # 保持连接30秒
|
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
client = httpx.AsyncClient(
|
|
|
|
|
|
timeout=httpx.Timeout(
|
2025-11-24 20:42:09 +08:00
|
|
|
|
connect=90.0, # 连接超时
|
|
|
|
|
|
read=300.0, # 读取超时
|
|
|
|
|
|
write=90.0, # 写入超时
|
|
|
|
|
|
pool=90.0 # 连接池超时
|
2025-11-22 18:23:30 +08:00
|
|
|
|
),
|
|
|
|
|
|
limits=limits,
|
|
|
|
|
|
headers={
|
|
|
|
|
|
"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36"
|
|
|
|
|
|
}
|
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
# 添加到池中
|
|
|
|
|
|
_http_client_pool[client_key] = client
|
|
|
|
|
|
logger.info(f"✅ 创建新HTTP客户端并加入池: {client_key} (池大小: {len(_http_client_pool)})")
|
|
|
|
|
|
|
|
|
|
|
|
return client
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
async def cleanup_http_clients():
|
|
|
|
|
|
"""清理所有HTTP客户端(应用关闭时调用)"""
|
|
|
|
|
|
global _http_client_pool
|
|
|
|
|
|
|
|
|
|
|
|
logger.info(f"🧹 开始清理HTTP客户端池 (共 {len(_http_client_pool)} 个客户端)")
|
|
|
|
|
|
|
|
|
|
|
|
for key, client in list(_http_client_pool.items()):
|
|
|
|
|
|
try:
|
|
|
|
|
|
if not client.is_closed:
|
|
|
|
|
|
await client.aclose()
|
|
|
|
|
|
logger.debug(f"✅ 关闭HTTP客户端: {key}")
|
|
|
|
|
|
except Exception as e:
|
|
|
|
|
|
logger.error(f"❌ 关闭HTTP客户端失败 {key}: {e}")
|
|
|
|
|
|
|
|
|
|
|
|
_http_client_pool.clear()
|
|
|
|
|
|
logger.info("✅ HTTP客户端池清理完成")
|
|
|
|
|
|
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
|
|
|
|
|
class AIService:
|
2025-10-30 16:53:50 +08:00
|
|
|
|
"""AI服务统一接口 - 支持从用户设置或全局配置初始化"""
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
2025-10-30 16:53:50 +08:00
|
|
|
|
def __init__(
|
|
|
|
|
|
self,
|
|
|
|
|
|
api_provider: Optional[str] = None,
|
|
|
|
|
|
api_key: Optional[str] = None,
|
|
|
|
|
|
api_base_url: Optional[str] = None,
|
|
|
|
|
|
default_model: Optional[str] = None,
|
|
|
|
|
|
default_temperature: Optional[float] = None,
|
2025-11-24 11:30:27 +08:00
|
|
|
|
default_max_tokens: Optional[int] = None,
|
|
|
|
|
|
enable_mcp_adapter: bool = True
|
2025-10-30 16:53:50 +08:00
|
|
|
|
):
|
|
|
|
|
|
"""
|
|
|
|
|
|
初始化AI客户端(优化并发性能)
|
|
|
|
|
|
|
|
|
|
|
|
Args:
|
|
|
|
|
|
api_provider: API提供商 (openai/anthropic),为None时使用全局配置
|
|
|
|
|
|
api_key: API密钥,为None时使用全局配置
|
|
|
|
|
|
api_base_url: API基础URL,为None时使用全局配置
|
|
|
|
|
|
default_model: 默认模型,为None时使用全局配置
|
|
|
|
|
|
default_temperature: 默认温度,为None时使用全局配置
|
|
|
|
|
|
default_max_tokens: 默认最大tokens,为None时使用全局配置
|
|
|
|
|
|
"""
|
|
|
|
|
|
# 保存用户设置或使用全局配置
|
|
|
|
|
|
self.api_provider = api_provider or app_settings.default_ai_provider
|
|
|
|
|
|
self.default_model = default_model or app_settings.default_model
|
|
|
|
|
|
self.default_temperature = default_temperature or app_settings.default_temperature
|
|
|
|
|
|
self.default_max_tokens = default_max_tokens or app_settings.default_max_tokens
|
|
|
|
|
|
|
2025-11-24 11:30:27 +08:00
|
|
|
|
# 初始化MCP适配器
|
|
|
|
|
|
self.enable_mcp_adapter = enable_mcp_adapter
|
|
|
|
|
|
if enable_mcp_adapter:
|
|
|
|
|
|
self.mcp_adapter = UniversalMCPAdapter()
|
|
|
|
|
|
logger.info("✅ MCP通用适配器已启用")
|
|
|
|
|
|
else:
|
|
|
|
|
|
self.mcp_adapter = None
|
|
|
|
|
|
logger.info("⚠️ MCP适配器已禁用")
|
|
|
|
|
|
|
2025-11-22 18:23:30 +08:00
|
|
|
|
# 初始化OpenAI客户端(使用HTTP客户端池)
|
2025-10-30 16:53:50 +08:00
|
|
|
|
openai_key = api_key if api_provider == "openai" else app_settings.openai_api_key
|
|
|
|
|
|
if openai_key:
|
2025-10-30 11:14:43 +08:00
|
|
|
|
try:
|
2025-11-22 18:23:30 +08:00
|
|
|
|
base_url = api_base_url if api_provider == "openai" else app_settings.openai_base_url
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
2025-11-22 18:23:30 +08:00
|
|
|
|
# 从池中获取或创建HTTP客户端(复用连接)
|
|
|
|
|
|
http_client = _get_or_create_http_client("openai", base_url, openai_key)
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
|
|
|
|
|
client_kwargs = {
|
2025-10-30 16:53:50 +08:00
|
|
|
|
"api_key": openai_key,
|
2025-10-30 11:14:43 +08:00
|
|
|
|
"http_client": http_client
|
|
|
|
|
|
}
|
|
|
|
|
|
|
2025-10-30 16:53:50 +08:00
|
|
|
|
if base_url:
|
|
|
|
|
|
client_kwargs["base_url"] = base_url
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
|
|
|
|
|
self.openai_client = AsyncOpenAI(**client_kwargs)
|
2025-11-03 15:28:51 +08:00
|
|
|
|
self.openai_http_client = http_client
|
|
|
|
|
|
self.openai_api_key = openai_key
|
|
|
|
|
|
self.openai_base_url = base_url
|
2025-11-22 18:23:30 +08:00
|
|
|
|
logger.info("✅ OpenAI客户端初始化成功(复用HTTP连接)")
|
2025-10-30 11:14:43 +08:00
|
|
|
|
except Exception as e:
|
|
|
|
|
|
logger.error(f"OpenAI客户端初始化失败: {e}")
|
|
|
|
|
|
self.openai_client = None
|
2025-11-03 15:28:51 +08:00
|
|
|
|
self.openai_http_client = None
|
|
|
|
|
|
self.openai_api_key = None
|
|
|
|
|
|
self.openai_base_url = None
|
2025-10-30 11:14:43 +08:00
|
|
|
|
else:
|
|
|
|
|
|
self.openai_client = None
|
2025-11-03 15:28:51 +08:00
|
|
|
|
self.openai_http_client = None
|
|
|
|
|
|
self.openai_api_key = None
|
|
|
|
|
|
self.openai_base_url = None
|
2025-11-10 21:16:55 +08:00
|
|
|
|
# 只有当用户明确选择OpenAI作为提供商时才警告
|
|
|
|
|
|
if self.api_provider == "openai":
|
|
|
|
|
|
logger.warning("⚠️ OpenAI API key未配置,但被设置为当前AI提供商")
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
2025-11-22 18:23:30 +08:00
|
|
|
|
# 初始化Anthropic客户端(使用HTTP客户端池)
|
2025-10-30 16:53:50 +08:00
|
|
|
|
anthropic_key = api_key if api_provider == "anthropic" else app_settings.anthropic_api_key
|
|
|
|
|
|
if anthropic_key:
|
2025-10-30 11:14:43 +08:00
|
|
|
|
try:
|
2025-11-22 18:23:30 +08:00
|
|
|
|
base_url = api_base_url if api_provider == "anthropic" else app_settings.anthropic_base_url
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
2025-11-22 18:23:30 +08:00
|
|
|
|
# 从池中获取或创建HTTP客户端(复用连接)
|
|
|
|
|
|
http_client = _get_or_create_http_client("anthropic", base_url, anthropic_key)
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
|
|
|
|
|
client_kwargs = {
|
2025-10-30 16:53:50 +08:00
|
|
|
|
"api_key": anthropic_key,
|
2025-10-30 11:14:43 +08:00
|
|
|
|
"http_client": http_client
|
|
|
|
|
|
}
|
|
|
|
|
|
|
2025-10-30 16:53:50 +08:00
|
|
|
|
if base_url:
|
|
|
|
|
|
client_kwargs["base_url"] = base_url
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
|
|
|
|
|
self.anthropic_client = AsyncAnthropic(**client_kwargs)
|
2025-11-22 18:23:30 +08:00
|
|
|
|
logger.info("✅ Anthropic客户端初始化成功(复用HTTP连接)")
|
2025-10-30 11:14:43 +08:00
|
|
|
|
except Exception as e:
|
|
|
|
|
|
logger.error(f"Anthropic客户端初始化失败: {e}")
|
|
|
|
|
|
self.anthropic_client = None
|
|
|
|
|
|
else:
|
|
|
|
|
|
self.anthropic_client = None
|
2025-11-10 21:16:55 +08:00
|
|
|
|
# 只有当用户明确选择Anthropic作为提供商时才警告
|
|
|
|
|
|
if self.api_provider == "anthropic":
|
|
|
|
|
|
logger.warning("⚠️ Anthropic API key未配置,但被设置为当前AI提供商")
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
|
|
|
|
|
async def generate_text(
|
|
|
|
|
|
self,
|
|
|
|
|
|
prompt: str,
|
|
|
|
|
|
provider: Optional[str] = None,
|
|
|
|
|
|
model: Optional[str] = None,
|
|
|
|
|
|
temperature: Optional[float] = None,
|
|
|
|
|
|
max_tokens: Optional[int] = None,
|
2025-11-07 22:14:20 +08:00
|
|
|
|
system_prompt: Optional[str] = None,
|
|
|
|
|
|
tools: Optional[List[Dict[str, Any]]] = None,
|
|
|
|
|
|
tool_choice: Optional[str] = None
|
|
|
|
|
|
) -> Dict[str, Any]:
|
2025-10-30 11:14:43 +08:00
|
|
|
|
"""
|
2025-11-07 22:14:20 +08:00
|
|
|
|
生成文本(支持工具调用)
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
|
|
|
|
|
Args:
|
|
|
|
|
|
prompt: 用户提示词
|
|
|
|
|
|
provider: AI提供商 (openai/anthropic)
|
|
|
|
|
|
model: 模型名称
|
|
|
|
|
|
temperature: 温度参数
|
|
|
|
|
|
max_tokens: 最大token数
|
|
|
|
|
|
system_prompt: 系统提示词
|
2025-11-07 22:14:20 +08:00
|
|
|
|
tools: 可用工具列表(MCP工具格式)
|
|
|
|
|
|
tool_choice: 工具选择策略 (auto/required/none)
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
|
|
|
|
|
Returns:
|
2025-11-07 22:14:20 +08:00
|
|
|
|
Dict包含:
|
|
|
|
|
|
- content: 文本内容(如果没有工具调用)
|
|
|
|
|
|
- tool_calls: 工具调用列表(如果AI决定调用工具)
|
|
|
|
|
|
- finish_reason: 完成原因
|
2025-10-30 11:14:43 +08:00
|
|
|
|
"""
|
2025-10-30 16:53:50 +08:00
|
|
|
|
provider = provider or self.api_provider
|
|
|
|
|
|
model = model or self.default_model
|
|
|
|
|
|
temperature = temperature or self.default_temperature
|
|
|
|
|
|
max_tokens = max_tokens or self.default_max_tokens
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
|
|
|
|
|
if provider == "openai":
|
2025-11-07 22:14:20 +08:00
|
|
|
|
return await self._generate_openai_with_tools(
|
|
|
|
|
|
prompt, model, temperature, max_tokens, system_prompt, tools, tool_choice
|
2025-10-30 11:14:43 +08:00
|
|
|
|
)
|
|
|
|
|
|
elif provider == "anthropic":
|
2025-11-07 22:14:20 +08:00
|
|
|
|
return await self._generate_anthropic_with_tools(
|
|
|
|
|
|
prompt, model, temperature, max_tokens, system_prompt, tools, tool_choice
|
2025-10-30 11:14:43 +08:00
|
|
|
|
)
|
|
|
|
|
|
else:
|
|
|
|
|
|
raise ValueError(f"不支持的AI提供商: {provider}")
|
|
|
|
|
|
|
|
|
|
|
|
async def generate_text_stream(
|
|
|
|
|
|
self,
|
|
|
|
|
|
prompt: str,
|
|
|
|
|
|
provider: Optional[str] = None,
|
|
|
|
|
|
model: Optional[str] = None,
|
|
|
|
|
|
temperature: Optional[float] = None,
|
|
|
|
|
|
max_tokens: Optional[int] = None,
|
|
|
|
|
|
system_prompt: Optional[str] = None
|
|
|
|
|
|
) -> AsyncGenerator[str, None]:
|
|
|
|
|
|
"""
|
|
|
|
|
|
流式生成文本
|
|
|
|
|
|
|
|
|
|
|
|
Args:
|
|
|
|
|
|
prompt: 用户提示词
|
|
|
|
|
|
provider: AI提供商
|
|
|
|
|
|
model: 模型名称
|
|
|
|
|
|
temperature: 温度参数
|
|
|
|
|
|
max_tokens: 最大token数
|
|
|
|
|
|
system_prompt: 系统提示词
|
|
|
|
|
|
|
|
|
|
|
|
Yields:
|
|
|
|
|
|
生成的文本片段
|
|
|
|
|
|
"""
|
2025-10-30 16:53:50 +08:00
|
|
|
|
provider = provider or self.api_provider
|
|
|
|
|
|
model = model or self.default_model
|
|
|
|
|
|
temperature = temperature or self.default_temperature
|
|
|
|
|
|
max_tokens = max_tokens or self.default_max_tokens
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
|
|
|
|
|
if provider == "openai":
|
|
|
|
|
|
async for chunk in self._generate_openai_stream(
|
|
|
|
|
|
prompt, model, temperature, max_tokens, system_prompt
|
|
|
|
|
|
):
|
|
|
|
|
|
yield chunk
|
|
|
|
|
|
elif provider == "anthropic":
|
|
|
|
|
|
async for chunk in self._generate_anthropic_stream(
|
|
|
|
|
|
prompt, model, temperature, max_tokens, system_prompt
|
|
|
|
|
|
):
|
|
|
|
|
|
yield chunk
|
|
|
|
|
|
else:
|
|
|
|
|
|
raise ValueError(f"不支持的AI提供商: {provider}")
|
|
|
|
|
|
|
|
|
|
|
|
async def _generate_openai(
|
|
|
|
|
|
self,
|
|
|
|
|
|
prompt: str,
|
|
|
|
|
|
model: str,
|
|
|
|
|
|
temperature: float,
|
|
|
|
|
|
max_tokens: int,
|
|
|
|
|
|
system_prompt: Optional[str]
|
|
|
|
|
|
) -> str:
|
2025-12-14 15:21:52 +08:00
|
|
|
|
"""使用OpenAI生成文本(带限流和重试)"""
|
2025-11-03 15:28:51 +08:00
|
|
|
|
if not self.openai_http_client:
|
2025-10-30 11:14:43 +08:00
|
|
|
|
raise ValueError("OpenAI客户端未初始化,请检查API key配置")
|
|
|
|
|
|
|
|
|
|
|
|
messages = []
|
|
|
|
|
|
if system_prompt:
|
|
|
|
|
|
messages.append({"role": "system", "content": system_prompt})
|
|
|
|
|
|
messages.append({"role": "user", "content": prompt})
|
|
|
|
|
|
|
2025-12-14 15:21:52 +08:00
|
|
|
|
# 使用全局信号量限流
|
|
|
|
|
|
async with _global_semaphore:
|
|
|
|
|
|
# 请求间隔
|
|
|
|
|
|
await asyncio.sleep(_request_delay)
|
2025-11-03 15:28:51 +08:00
|
|
|
|
|
2025-12-14 15:21:52 +08:00
|
|
|
|
# 重试机制
|
|
|
|
|
|
max_retries = 3
|
|
|
|
|
|
for attempt in range(max_retries):
|
|
|
|
|
|
try:
|
|
|
|
|
|
if attempt > 0:
|
|
|
|
|
|
wait_time = min(2 ** attempt, 10) # 指数退避
|
|
|
|
|
|
logger.warning(f"⚠️ OpenAI API调用失败,{wait_time}秒后重试(第{attempt + 1}/{max_retries}次)")
|
|
|
|
|
|
await asyncio.sleep(wait_time)
|
|
|
|
|
|
|
|
|
|
|
|
logger.info(f"🔵 开始调用OpenAI API(尝试 {attempt + 1}/{max_retries})")
|
|
|
|
|
|
logger.info(f" - 模型: {model}")
|
|
|
|
|
|
logger.info(f" - 温度: {temperature}")
|
|
|
|
|
|
logger.info(f" - 最大tokens: {max_tokens}")
|
|
|
|
|
|
logger.info(f" - Prompt长度: {len(prompt)} 字符")
|
|
|
|
|
|
logger.info(f" - 消息数量: {len(messages)}")
|
|
|
|
|
|
|
|
|
|
|
|
url = f"{self.openai_base_url}/chat/completions"
|
|
|
|
|
|
headers = {
|
|
|
|
|
|
"Authorization": f"Bearer {self.openai_api_key}",
|
|
|
|
|
|
"Content-Type": "application/json"
|
|
|
|
|
|
}
|
|
|
|
|
|
payload = {
|
|
|
|
|
|
"model": model,
|
|
|
|
|
|
"messages": messages,
|
|
|
|
|
|
"temperature": temperature,
|
|
|
|
|
|
"max_tokens": max_tokens
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
logger.debug(f" - 请求URL: {url}")
|
|
|
|
|
|
logger.debug(f" - 请求头: Authorization=Bearer ***")
|
|
|
|
|
|
|
|
|
|
|
|
response = await self.openai_http_client.post(url, headers=headers, json=payload)
|
|
|
|
|
|
response.raise_for_status()
|
|
|
|
|
|
|
|
|
|
|
|
data = response.json()
|
|
|
|
|
|
|
|
|
|
|
|
logger.info(f"✅ OpenAI API调用成功")
|
|
|
|
|
|
logger.info(f" - 响应ID: {data.get('id', 'N/A')}")
|
|
|
|
|
|
logger.info(f" - 选项数量: {len(data.get('choices', []))}")
|
|
|
|
|
|
logger.debug(f" - 完整API响应: {data}")
|
|
|
|
|
|
|
|
|
|
|
|
if not data.get('choices'):
|
|
|
|
|
|
logger.error("❌ OpenAI返回的choices为空")
|
|
|
|
|
|
raise ValueError("API返回的响应格式错误:choices字段为空")
|
|
|
|
|
|
|
|
|
|
|
|
choice = data['choices'][0]
|
|
|
|
|
|
message = choice.get('message', {})
|
|
|
|
|
|
finish_reason = choice.get('finish_reason')
|
|
|
|
|
|
|
|
|
|
|
|
# DeepSeek R1特殊处理:只使用content(最终答案),忽略reasoning_content(思考过程)
|
|
|
|
|
|
# reasoning_content是AI的思考过程,不是我们需要的JSON结果
|
|
|
|
|
|
content = message.get('content', '')
|
|
|
|
|
|
|
|
|
|
|
|
# 检查是否因达到长度限制而截断
|
|
|
|
|
|
if finish_reason == 'length':
|
|
|
|
|
|
logger.warning(f"⚠️ 响应因达到max_tokens限制而被截断")
|
|
|
|
|
|
logger.warning(f" - 当前max_tokens: {max_tokens}")
|
|
|
|
|
|
logger.warning(f" - 建议: 增加max_tokens参数(推荐2000+)")
|
|
|
|
|
|
|
|
|
|
|
|
if content:
|
|
|
|
|
|
logger.info(f" - 返回内容长度: {len(content)} 字符")
|
|
|
|
|
|
logger.info(f" - 完成原因: {finish_reason}")
|
|
|
|
|
|
logger.info(f" - 返回内容预览(前200字符): {content[:200]}")
|
|
|
|
|
|
return content
|
|
|
|
|
|
else:
|
|
|
|
|
|
logger.error("❌ AI返回了空内容")
|
|
|
|
|
|
logger.error(f" - 完整响应: {data}")
|
|
|
|
|
|
logger.error(f" - 完成原因: {finish_reason}")
|
|
|
|
|
|
|
|
|
|
|
|
# 提供更详细的错误信息
|
|
|
|
|
|
if finish_reason == 'length':
|
|
|
|
|
|
raise ValueError(f"AI响应被截断且无有效内容。请增加max_tokens参数(当前: {max_tokens},建议: 2000+)")
|
|
|
|
|
|
else:
|
|
|
|
|
|
raise ValueError(f"AI返回了空内容(finish_reason: {finish_reason}),请检查API配置或稍后重试")
|
2025-11-03 15:28:51 +08:00
|
|
|
|
|
2025-12-14 15:21:52 +08:00
|
|
|
|
except httpx.ConnectError as e:
|
|
|
|
|
|
logger.error(f"❌ OpenAI API连接失败 (尝试 {attempt + 1}/{max_retries}): {str(e)}")
|
|
|
|
|
|
if attempt == max_retries - 1:
|
|
|
|
|
|
raise Exception(f"连接失败,已重试{max_retries}次。请检查网络连接或API地址: {str(e)}")
|
|
|
|
|
|
continue
|
|
|
|
|
|
|
|
|
|
|
|
except httpx.HTTPStatusError as e:
|
|
|
|
|
|
logger.error(f"❌ OpenAI API调用失败 (HTTP {e.response.status_code}, 尝试 {attempt + 1}/{max_retries})")
|
|
|
|
|
|
logger.error(f" - 错误信息: {e.response.text}")
|
|
|
|
|
|
|
|
|
|
|
|
# 某些错误不需要重试(如401、403)
|
|
|
|
|
|
if e.response.status_code in [401, 403, 404]:
|
|
|
|
|
|
raise Exception(f"API返回错误 ({e.response.status_code}): {e.response.text}")
|
|
|
|
|
|
|
|
|
|
|
|
if attempt == max_retries - 1:
|
|
|
|
|
|
raise Exception(f"API返回错误 ({e.response.status_code}): {e.response.text}")
|
|
|
|
|
|
continue
|
|
|
|
|
|
|
|
|
|
|
|
except httpx.TimeoutException as e:
|
|
|
|
|
|
logger.error(f"❌ OpenAI API超时 (尝试 {attempt + 1}/{max_retries})")
|
|
|
|
|
|
if attempt == max_retries - 1:
|
|
|
|
|
|
raise Exception(f"API请求超时,已重试{max_retries}次: {str(e)}")
|
|
|
|
|
|
continue
|
|
|
|
|
|
|
|
|
|
|
|
except Exception as e:
|
|
|
|
|
|
logger.error(f"❌ OpenAI API调用失败 (尝试 {attempt + 1}/{max_retries})")
|
|
|
|
|
|
logger.error(f" - 错误类型: {type(e).__name__}")
|
|
|
|
|
|
logger.error(f" - 错误信息: {str(e)}")
|
|
|
|
|
|
|
|
|
|
|
|
if attempt == max_retries - 1:
|
|
|
|
|
|
raise
|
|
|
|
|
|
continue
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
2025-11-07 22:14:20 +08:00
|
|
|
|
|
|
|
|
|
|
async def _generate_openai_with_tools(
|
|
|
|
|
|
self,
|
|
|
|
|
|
prompt: str,
|
|
|
|
|
|
model: str,
|
|
|
|
|
|
temperature: float,
|
|
|
|
|
|
max_tokens: int,
|
|
|
|
|
|
system_prompt: Optional[str],
|
|
|
|
|
|
tools: Optional[List[Dict[str, Any]]] = None,
|
|
|
|
|
|
tool_choice: Optional[str] = None
|
|
|
|
|
|
) -> Dict[str, Any]:
|
2025-11-24 11:30:27 +08:00
|
|
|
|
"""使用OpenAI生成文本(支持工具调用,集成MCP适配器)"""
|
2025-11-07 22:14:20 +08:00
|
|
|
|
if not self.openai_http_client:
|
|
|
|
|
|
raise ValueError("OpenAI客户端未初始化,请检查API key配置")
|
|
|
|
|
|
|
|
|
|
|
|
messages = []
|
|
|
|
|
|
if system_prompt:
|
|
|
|
|
|
messages.append({"role": "system", "content": system_prompt})
|
|
|
|
|
|
messages.append({"role": "user", "content": prompt})
|
|
|
|
|
|
|
2025-11-24 11:30:27 +08:00
|
|
|
|
# 如果启用了MCP适配器且有工具,使用适配器处理
|
|
|
|
|
|
if self.enable_mcp_adapter and self.mcp_adapter and tools:
|
|
|
|
|
|
logger.info(f"🎯 使用MCP适配器处理工具调用")
|
|
|
|
|
|
|
|
|
|
|
|
# 生成API标识符
|
|
|
|
|
|
api_identifier = f"openai_{self.openai_base_url or 'default'}"
|
|
|
|
|
|
|
|
|
|
|
|
# 定义API调用函数
|
|
|
|
|
|
async def call_api(message: str, tools_param: Optional[List] = None, tool_choice_param: Optional[str] = None):
|
|
|
|
|
|
"""实际调用OpenAI API的函数"""
|
|
|
|
|
|
call_messages = messages.copy()
|
|
|
|
|
|
call_messages[-1]["content"] = message
|
|
|
|
|
|
|
|
|
|
|
|
url = f"{self.openai_base_url}/chat/completions"
|
|
|
|
|
|
headers = {
|
|
|
|
|
|
"Authorization": f"Bearer {self.openai_api_key}",
|
|
|
|
|
|
"Content-Type": "application/json"
|
|
|
|
|
|
}
|
|
|
|
|
|
payload = {
|
|
|
|
|
|
"model": model,
|
|
|
|
|
|
"messages": call_messages,
|
|
|
|
|
|
"temperature": temperature,
|
|
|
|
|
|
"max_tokens": max_tokens
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
# 只在tools_param不为None时添加工具参数
|
|
|
|
|
|
if tools_param is not None:
|
|
|
|
|
|
# 清理工具定义,移除$schema字段(某些API不支持)
|
|
|
|
|
|
cleaned_tools = []
|
|
|
|
|
|
for tool in tools_param:
|
|
|
|
|
|
cleaned_tool = tool.copy()
|
|
|
|
|
|
if "function" in cleaned_tool and "parameters" in cleaned_tool["function"]:
|
|
|
|
|
|
params = cleaned_tool["function"]["parameters"].copy()
|
|
|
|
|
|
# 移除$schema字段
|
|
|
|
|
|
params.pop("$schema", None)
|
|
|
|
|
|
cleaned_tool["function"]["parameters"] = params
|
|
|
|
|
|
cleaned_tools.append(cleaned_tool)
|
|
|
|
|
|
|
|
|
|
|
|
payload["tools"] = cleaned_tools
|
|
|
|
|
|
if tool_choice_param:
|
|
|
|
|
|
payload["tool_choice"] = tool_choice_param
|
|
|
|
|
|
|
|
|
|
|
|
response = await self.openai_http_client.post(url, headers=headers, json=payload)
|
|
|
|
|
|
response.raise_for_status()
|
|
|
|
|
|
return response.json()
|
|
|
|
|
|
|
|
|
|
|
|
# 定义测试函数(检测API是否支持Function Calling)
|
|
|
|
|
|
async def test_fc():
|
|
|
|
|
|
"""测试Function Calling支持"""
|
|
|
|
|
|
test_tools = [{
|
|
|
|
|
|
"type": "function",
|
|
|
|
|
|
"function": {
|
|
|
|
|
|
"name": "test_function",
|
|
|
|
|
|
"description": "测试函数",
|
|
|
|
|
|
"parameters": {"type": "object", "properties": {}}
|
|
|
|
|
|
}
|
|
|
|
|
|
}]
|
|
|
|
|
|
try:
|
|
|
|
|
|
result = await call_api("测试", tools_param=test_tools, tool_choice_param="none")
|
|
|
|
|
|
return result
|
|
|
|
|
|
except Exception as e:
|
|
|
|
|
|
logger.debug(f"Function Calling测试失败: {e}")
|
|
|
|
|
|
raise
|
|
|
|
|
|
|
|
|
|
|
|
try:
|
|
|
|
|
|
# 使用适配器处理(自动检测、降级、缓存)
|
|
|
|
|
|
result = await self.mcp_adapter.call_with_fallback(
|
|
|
|
|
|
api_identifier=api_identifier,
|
|
|
|
|
|
tools=tools,
|
|
|
|
|
|
user_message=prompt,
|
|
|
|
|
|
call_function=call_api,
|
|
|
|
|
|
test_function=test_fc
|
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
# 转换结果格式
|
|
|
|
|
|
if result.has_tool_calls:
|
|
|
|
|
|
return {
|
|
|
|
|
|
"tool_calls": result.tool_calls,
|
|
|
|
|
|
"content": result.raw_response,
|
|
|
|
|
|
"finish_reason": "tool_calls"
|
|
|
|
|
|
}
|
|
|
|
|
|
else:
|
|
|
|
|
|
return {
|
|
|
|
|
|
"content": result.raw_response,
|
|
|
|
|
|
"finish_reason": "stop"
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
except Exception as e:
|
|
|
|
|
|
logger.error(f"❌ MCP适配器调用失败: {str(e)}")
|
|
|
|
|
|
# 降级到原始实现
|
|
|
|
|
|
logger.warning("⚠️ 降级到原始OpenAI调用")
|
|
|
|
|
|
|
|
|
|
|
|
# 原始实现(无适配器或降级)
|
2025-11-07 22:14:20 +08:00
|
|
|
|
try:
|
2025-11-24 11:30:27 +08:00
|
|
|
|
logger.info(f"🔵 开始调用OpenAI API(原始模式)")
|
2025-11-07 22:14:20 +08:00
|
|
|
|
logger.info(f" - 模型: {model}")
|
|
|
|
|
|
logger.info(f" - 工具数量: {len(tools) if tools else 0}")
|
|
|
|
|
|
|
|
|
|
|
|
url = f"{self.openai_base_url}/chat/completions"
|
|
|
|
|
|
headers = {
|
|
|
|
|
|
"Authorization": f"Bearer {self.openai_api_key}",
|
|
|
|
|
|
"Content-Type": "application/json"
|
|
|
|
|
|
}
|
|
|
|
|
|
payload = {
|
|
|
|
|
|
"model": model,
|
|
|
|
|
|
"messages": messages,
|
|
|
|
|
|
"temperature": temperature,
|
|
|
|
|
|
"max_tokens": max_tokens
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
# 添加工具参数
|
|
|
|
|
|
if tools:
|
|
|
|
|
|
payload["tools"] = tools
|
|
|
|
|
|
if tool_choice:
|
|
|
|
|
|
if tool_choice == "required":
|
|
|
|
|
|
payload["tool_choice"] = "required"
|
|
|
|
|
|
elif tool_choice == "auto":
|
|
|
|
|
|
payload["tool_choice"] = "auto"
|
|
|
|
|
|
elif tool_choice == "none":
|
|
|
|
|
|
payload["tool_choice"] = "none"
|
|
|
|
|
|
|
|
|
|
|
|
response = await self.openai_http_client.post(url, headers=headers, json=payload)
|
|
|
|
|
|
response.raise_for_status()
|
|
|
|
|
|
|
|
|
|
|
|
data = response.json()
|
|
|
|
|
|
|
|
|
|
|
|
logger.info(f"✅ OpenAI API调用成功")
|
|
|
|
|
|
logger.debug(f" - 完整API响应: {data}")
|
|
|
|
|
|
|
|
|
|
|
|
if not data.get('choices'):
|
|
|
|
|
|
logger.error(f"❌ API返回的choices为空")
|
|
|
|
|
|
logger.error(f" - 完整响应: {data}")
|
|
|
|
|
|
logger.error(f" - 响应键: {list(data.keys())}")
|
|
|
|
|
|
raise ValueError(f"API返回的响应格式错误:choices字段为空。完整响应: {data}")
|
|
|
|
|
|
|
|
|
|
|
|
choice = data['choices'][0]
|
|
|
|
|
|
message = choice.get('message', {})
|
|
|
|
|
|
finish_reason = choice.get('finish_reason')
|
|
|
|
|
|
|
|
|
|
|
|
# 检查是否有工具调用
|
|
|
|
|
|
tool_calls = message.get('tool_calls')
|
|
|
|
|
|
if tool_calls:
|
|
|
|
|
|
logger.info(f"🔧 AI请求调用 {len(tool_calls)} 个工具")
|
|
|
|
|
|
return {
|
|
|
|
|
|
"tool_calls": tool_calls,
|
|
|
|
|
|
"content": message.get('content', ''),
|
|
|
|
|
|
"finish_reason": finish_reason
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
# 没有工具调用,返回普通内容
|
|
|
|
|
|
content = message.get('content', '')
|
|
|
|
|
|
if content:
|
|
|
|
|
|
return {
|
|
|
|
|
|
"content": content,
|
|
|
|
|
|
"finish_reason": finish_reason
|
|
|
|
|
|
}
|
|
|
|
|
|
else:
|
|
|
|
|
|
raise ValueError(f"AI返回了空内容(finish_reason: {finish_reason})")
|
|
|
|
|
|
|
|
|
|
|
|
except httpx.HTTPStatusError as e:
|
|
|
|
|
|
logger.error(f"❌ OpenAI API调用失败 (HTTP {e.response.status_code})")
|
|
|
|
|
|
logger.error(f" - 错误信息: {e.response.text}")
|
|
|
|
|
|
raise Exception(f"API返回错误 ({e.response.status_code}): {e.response.text}")
|
|
|
|
|
|
except Exception as e:
|
|
|
|
|
|
logger.error(f"❌ OpenAI API调用失败: {str(e)}")
|
|
|
|
|
|
raise
|
|
|
|
|
|
|
|
|
|
|
|
async def _generate_anthropic_with_tools(
|
|
|
|
|
|
self,
|
|
|
|
|
|
prompt: str,
|
|
|
|
|
|
model: str,
|
|
|
|
|
|
temperature: float,
|
|
|
|
|
|
max_tokens: int,
|
|
|
|
|
|
system_prompt: Optional[str],
|
|
|
|
|
|
tools: Optional[List[Dict[str, Any]]] = None,
|
|
|
|
|
|
tool_choice: Optional[str] = None
|
|
|
|
|
|
) -> Dict[str, Any]:
|
|
|
|
|
|
"""使用Anthropic生成文本(支持工具调用)"""
|
|
|
|
|
|
if not self.anthropic_client:
|
|
|
|
|
|
raise ValueError("Anthropic客户端未初始化,请检查API key配置")
|
|
|
|
|
|
|
|
|
|
|
|
try:
|
|
|
|
|
|
logger.info(f"🔵 开始调用Anthropic API(支持工具调用)")
|
|
|
|
|
|
logger.info(f" - 模型: {model}")
|
|
|
|
|
|
logger.info(f" - 工具数量: {len(tools) if tools else 0}")
|
|
|
|
|
|
|
|
|
|
|
|
kwargs = {
|
|
|
|
|
|
"model": model,
|
|
|
|
|
|
"max_tokens": max_tokens,
|
|
|
|
|
|
"temperature": temperature,
|
|
|
|
|
|
"messages": [{"role": "user", "content": prompt}]
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
if system_prompt:
|
|
|
|
|
|
kwargs["system"] = system_prompt
|
|
|
|
|
|
|
|
|
|
|
|
# 添加工具参数
|
|
|
|
|
|
if tools:
|
|
|
|
|
|
kwargs["tools"] = tools
|
|
|
|
|
|
if tool_choice == "required":
|
|
|
|
|
|
kwargs["tool_choice"] = {"type": "any"}
|
|
|
|
|
|
elif tool_choice == "auto":
|
|
|
|
|
|
kwargs["tool_choice"] = {"type": "auto"}
|
|
|
|
|
|
|
|
|
|
|
|
response = await self.anthropic_client.messages.create(**kwargs)
|
|
|
|
|
|
|
|
|
|
|
|
# 检查是否有工具调用
|
|
|
|
|
|
tool_calls = []
|
|
|
|
|
|
content_text = ""
|
|
|
|
|
|
|
|
|
|
|
|
for block in response.content:
|
|
|
|
|
|
if block.type == "tool_use":
|
|
|
|
|
|
tool_calls.append({
|
|
|
|
|
|
"id": block.id,
|
|
|
|
|
|
"type": "function",
|
|
|
|
|
|
"function": {
|
|
|
|
|
|
"name": block.name,
|
|
|
|
|
|
"arguments": block.input
|
|
|
|
|
|
}
|
|
|
|
|
|
})
|
|
|
|
|
|
elif block.type == "text":
|
|
|
|
|
|
content_text += block.text
|
|
|
|
|
|
|
|
|
|
|
|
if tool_calls:
|
|
|
|
|
|
logger.info(f"🔧 AI请求调用 {len(tool_calls)} 个工具")
|
|
|
|
|
|
return {
|
|
|
|
|
|
"tool_calls": tool_calls,
|
|
|
|
|
|
"content": content_text,
|
|
|
|
|
|
"finish_reason": response.stop_reason
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
return {
|
|
|
|
|
|
"content": content_text,
|
|
|
|
|
|
"finish_reason": response.stop_reason
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
except Exception as e:
|
|
|
|
|
|
logger.error(f"❌ Anthropic API调用失败: {str(e)}")
|
|
|
|
|
|
raise
|
|
|
|
|
|
|
2025-10-30 11:14:43 +08:00
|
|
|
|
async def _generate_openai_stream(
|
|
|
|
|
|
self,
|
|
|
|
|
|
prompt: str,
|
|
|
|
|
|
model: str,
|
|
|
|
|
|
temperature: float,
|
|
|
|
|
|
max_tokens: int,
|
|
|
|
|
|
system_prompt: Optional[str]
|
|
|
|
|
|
) -> AsyncGenerator[str, None]:
|
|
|
|
|
|
"""使用OpenAI流式生成文本"""
|
2025-11-03 15:28:51 +08:00
|
|
|
|
if not self.openai_http_client:
|
2025-10-30 11:14:43 +08:00
|
|
|
|
raise ValueError("OpenAI客户端未初始化,请检查API key配置")
|
|
|
|
|
|
|
|
|
|
|
|
messages = []
|
|
|
|
|
|
if system_prompt:
|
|
|
|
|
|
messages.append({"role": "system", "content": system_prompt})
|
|
|
|
|
|
messages.append({"role": "user", "content": prompt})
|
|
|
|
|
|
|
|
|
|
|
|
try:
|
2025-11-03 15:28:51 +08:00
|
|
|
|
logger.info(f"🔵 开始调用OpenAI流式API(直接HTTP请求)")
|
2025-10-30 11:14:43 +08:00
|
|
|
|
logger.info(f" - 模型: {model}")
|
|
|
|
|
|
logger.info(f" - Prompt长度: {len(prompt)} 字符")
|
|
|
|
|
|
logger.info(f" - 最大tokens: {max_tokens}")
|
|
|
|
|
|
|
2025-11-03 15:28:51 +08:00
|
|
|
|
url = f"{self.openai_base_url}/chat/completions"
|
|
|
|
|
|
headers = {
|
|
|
|
|
|
"Authorization": f"Bearer {self.openai_api_key}",
|
|
|
|
|
|
"Content-Type": "application/json"
|
|
|
|
|
|
}
|
|
|
|
|
|
payload = {
|
|
|
|
|
|
"model": model,
|
|
|
|
|
|
"messages": messages,
|
|
|
|
|
|
"temperature": temperature,
|
|
|
|
|
|
"max_tokens": max_tokens,
|
|
|
|
|
|
"stream": True
|
|
|
|
|
|
}
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
2025-11-03 15:28:51 +08:00
|
|
|
|
async with self.openai_http_client.stream('POST', url, headers=headers, json=payload) as response:
|
|
|
|
|
|
response.raise_for_status()
|
|
|
|
|
|
logger.info(f"✅ OpenAI流式API连接成功,开始接收数据...")
|
|
|
|
|
|
|
|
|
|
|
|
chunk_count = 0
|
|
|
|
|
|
has_content = False
|
|
|
|
|
|
finish_reason = None
|
|
|
|
|
|
|
|
|
|
|
|
async for line in response.aiter_lines():
|
|
|
|
|
|
if line.startswith('data: '):
|
|
|
|
|
|
data_str = line[6:]
|
|
|
|
|
|
if data_str.strip() == '[DONE]':
|
|
|
|
|
|
break
|
|
|
|
|
|
|
|
|
|
|
|
try:
|
|
|
|
|
|
import json
|
|
|
|
|
|
data = json.loads(data_str)
|
|
|
|
|
|
if 'choices' in data and len(data['choices']) > 0:
|
|
|
|
|
|
choice = data['choices'][0]
|
|
|
|
|
|
delta = choice.get('delta', {})
|
|
|
|
|
|
finish_reason = choice.get('finish_reason') or finish_reason
|
|
|
|
|
|
|
|
|
|
|
|
# DeepSeek R1特殊处理:只收集content(最终答案),忽略reasoning_content(思考过程)
|
|
|
|
|
|
# reasoning_content是AI的思考过程,不是我们需要的JSON结果
|
|
|
|
|
|
content = delta.get('content', '')
|
|
|
|
|
|
|
|
|
|
|
|
if content:
|
|
|
|
|
|
chunk_count += 1
|
|
|
|
|
|
has_content = True
|
|
|
|
|
|
yield content
|
|
|
|
|
|
except json.JSONDecodeError:
|
|
|
|
|
|
continue
|
|
|
|
|
|
|
|
|
|
|
|
# 检查是否因长度限制截断
|
|
|
|
|
|
if finish_reason == 'length':
|
|
|
|
|
|
logger.warning(f"⚠️ 流式响应因达到max_tokens限制而被截断")
|
|
|
|
|
|
logger.warning(f" - 当前max_tokens: {max_tokens}")
|
|
|
|
|
|
logger.warning(f" - 建议: 增加max_tokens参数(推荐2000+)")
|
|
|
|
|
|
|
|
|
|
|
|
if not has_content:
|
|
|
|
|
|
logger.warning(f"⚠️ 流式响应未返回任何内容")
|
|
|
|
|
|
logger.warning(f" - 完成原因: {finish_reason}")
|
|
|
|
|
|
|
|
|
|
|
|
logger.info(f"✅ OpenAI流式生成完成,共接收 {chunk_count} 个chunk,完成原因: {finish_reason}")
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
|
|
|
|
|
except httpx.TimeoutException as e:
|
|
|
|
|
|
logger.error(f"❌ OpenAI流式API超时")
|
|
|
|
|
|
logger.error(f" - 错误: {str(e)}")
|
|
|
|
|
|
logger.error(f" - 提示: 请检查网络连接或考虑缩短prompt长度")
|
|
|
|
|
|
raise TimeoutError(f"AI服务超时(180秒),请稍后重试或减少上下文长度") from e
|
2025-11-03 15:28:51 +08:00
|
|
|
|
except httpx.HTTPStatusError as e:
|
|
|
|
|
|
logger.error(f"❌ OpenAI流式API调用失败 (HTTP {e.response.status_code})")
|
|
|
|
|
|
logger.error(f" - 错误信息: {await e.response.aread()}")
|
|
|
|
|
|
raise
|
2025-10-30 11:14:43 +08:00
|
|
|
|
except Exception as e:
|
|
|
|
|
|
logger.error(f"❌ OpenAI流式API调用失败: {str(e)}")
|
|
|
|
|
|
logger.error(f" - 错误类型: {type(e).__name__}")
|
|
|
|
|
|
raise
|
|
|
|
|
|
|
|
|
|
|
|
async def _generate_anthropic(
|
|
|
|
|
|
self,
|
|
|
|
|
|
prompt: str,
|
|
|
|
|
|
model: str,
|
|
|
|
|
|
temperature: float,
|
|
|
|
|
|
max_tokens: int,
|
|
|
|
|
|
system_prompt: Optional[str]
|
|
|
|
|
|
) -> str:
|
|
|
|
|
|
"""使用Anthropic生成文本"""
|
|
|
|
|
|
if not self.anthropic_client:
|
|
|
|
|
|
raise ValueError("Anthropic客户端未初始化,请检查API key配置")
|
|
|
|
|
|
|
|
|
|
|
|
try:
|
|
|
|
|
|
response = await self.anthropic_client.messages.create(
|
|
|
|
|
|
model=model,
|
|
|
|
|
|
max_tokens=max_tokens,
|
|
|
|
|
|
temperature=temperature,
|
|
|
|
|
|
system=system_prompt or "",
|
|
|
|
|
|
messages=[{"role": "user", "content": prompt}]
|
|
|
|
|
|
)
|
|
|
|
|
|
return response.content[0].text
|
|
|
|
|
|
except Exception as e:
|
|
|
|
|
|
logger.error(f"Anthropic API调用失败: {str(e)}")
|
|
|
|
|
|
raise
|
|
|
|
|
|
|
|
|
|
|
|
async def _generate_anthropic_stream(
|
|
|
|
|
|
self,
|
|
|
|
|
|
prompt: str,
|
|
|
|
|
|
model: str,
|
|
|
|
|
|
temperature: float,
|
|
|
|
|
|
max_tokens: int,
|
|
|
|
|
|
system_prompt: Optional[str]
|
|
|
|
|
|
) -> AsyncGenerator[str, None]:
|
|
|
|
|
|
"""使用Anthropic流式生成文本"""
|
|
|
|
|
|
if not self.anthropic_client:
|
|
|
|
|
|
raise ValueError("Anthropic客户端未初始化,请检查API key配置")
|
|
|
|
|
|
|
|
|
|
|
|
try:
|
|
|
|
|
|
logger.info(f"🔵 开始调用Anthropic流式API")
|
|
|
|
|
|
logger.info(f" - 模型: {model}")
|
|
|
|
|
|
logger.info(f" - Prompt长度: {len(prompt)} 字符")
|
|
|
|
|
|
logger.info(f" - 最大tokens: {max_tokens}")
|
|
|
|
|
|
|
|
|
|
|
|
async with self.anthropic_client.messages.stream(
|
|
|
|
|
|
model=model,
|
|
|
|
|
|
max_tokens=max_tokens,
|
|
|
|
|
|
temperature=temperature,
|
|
|
|
|
|
system=system_prompt or "",
|
|
|
|
|
|
messages=[{"role": "user", "content": prompt}]
|
|
|
|
|
|
) as stream:
|
|
|
|
|
|
logger.info(f"✅ Anthropic流式API连接成功,开始接收数据...")
|
|
|
|
|
|
|
|
|
|
|
|
chunk_count = 0
|
|
|
|
|
|
async for text in stream.text_stream:
|
|
|
|
|
|
chunk_count += 1
|
|
|
|
|
|
yield text
|
|
|
|
|
|
|
|
|
|
|
|
logger.info(f"✅ Anthropic流式生成完成,共接收 {chunk_count} 个chunk")
|
|
|
|
|
|
|
|
|
|
|
|
except httpx.TimeoutException as e:
|
|
|
|
|
|
logger.error(f"❌ Anthropic流式API超时")
|
|
|
|
|
|
logger.error(f" - 错误: {str(e)}")
|
|
|
|
|
|
raise TimeoutError(f"AI服务超时(180秒),请稍后重试或减少上下文长度") from e
|
|
|
|
|
|
except Exception as e:
|
|
|
|
|
|
logger.error(f"❌ Anthropic流式API调用失败: {str(e)}")
|
|
|
|
|
|
logger.error(f" - 错误类型: {type(e).__name__}")
|
|
|
|
|
|
raise
|
2025-11-07 22:14:20 +08:00
|
|
|
|
|
|
|
|
|
|
async def generate_text_with_mcp(
|
|
|
|
|
|
self,
|
|
|
|
|
|
prompt: str,
|
|
|
|
|
|
user_id: str,
|
|
|
|
|
|
db_session,
|
|
|
|
|
|
enable_mcp: bool = True,
|
|
|
|
|
|
max_tool_rounds: int = 3,
|
|
|
|
|
|
tool_choice: str = "auto",
|
|
|
|
|
|
**kwargs
|
|
|
|
|
|
) -> Dict[str, Any]:
|
|
|
|
|
|
"""
|
|
|
|
|
|
支持MCP工具的AI文本生成(非流式)
|
|
|
|
|
|
|
|
|
|
|
|
Args:
|
|
|
|
|
|
prompt: 用户提示词
|
|
|
|
|
|
user_id: 用户ID,用于获取MCP工具
|
|
|
|
|
|
db_session: 数据库会话
|
|
|
|
|
|
enable_mcp: 是否启用MCP增强
|
|
|
|
|
|
max_tool_rounds: 最大工具调用轮次
|
|
|
|
|
|
tool_choice: 工具选择策略(auto/required/none)
|
|
|
|
|
|
**kwargs: 其他AI参数(provider, model, temperature等)
|
|
|
|
|
|
|
|
|
|
|
|
Returns:
|
|
|
|
|
|
{
|
|
|
|
|
|
"content": "AI生成的最终文本",
|
|
|
|
|
|
"tool_calls_made": 2, # 实际调用的工具次数
|
|
|
|
|
|
"tools_used": ["exa_search", "filesystem_read"],
|
|
|
|
|
|
"finish_reason": "stop",
|
|
|
|
|
|
"mcp_enhanced": True
|
|
|
|
|
|
}
|
|
|
|
|
|
"""
|
|
|
|
|
|
from app.services.mcp_tool_service import mcp_tool_service, MCPToolServiceError
|
|
|
|
|
|
|
|
|
|
|
|
# 初始化返回结果
|
|
|
|
|
|
result = {
|
|
|
|
|
|
"content": "",
|
|
|
|
|
|
"tool_calls_made": 0,
|
|
|
|
|
|
"tools_used": [],
|
|
|
|
|
|
"finish_reason": "",
|
|
|
|
|
|
"mcp_enhanced": False
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
# 1. 获取MCP工具(如果启用)
|
|
|
|
|
|
tools = None
|
|
|
|
|
|
if enable_mcp:
|
|
|
|
|
|
try:
|
|
|
|
|
|
tools = await mcp_tool_service.get_user_enabled_tools(
|
|
|
|
|
|
user_id=user_id,
|
|
|
|
|
|
db_session=db_session
|
|
|
|
|
|
)
|
|
|
|
|
|
if tools:
|
|
|
|
|
|
logger.info(f"MCP增强: 加载了 {len(tools)} 个工具")
|
|
|
|
|
|
result["mcp_enhanced"] = True
|
|
|
|
|
|
except MCPToolServiceError as e:
|
|
|
|
|
|
logger.error(f"获取MCP工具失败,降级为普通生成: {e}")
|
|
|
|
|
|
tools = None
|
|
|
|
|
|
|
|
|
|
|
|
# 2. 工具调用循环
|
|
|
|
|
|
conversation_history = [
|
|
|
|
|
|
{"role": "user", "content": prompt}
|
|
|
|
|
|
]
|
|
|
|
|
|
|
|
|
|
|
|
for round_num in range(max_tool_rounds):
|
|
|
|
|
|
logger.info(f"MCP工具调用轮次: {round_num + 1}/{max_tool_rounds}")
|
|
|
|
|
|
|
|
|
|
|
|
# 调用AI
|
|
|
|
|
|
ai_response = await self.generate_text(
|
|
|
|
|
|
prompt=conversation_history[-1]["content"],
|
|
|
|
|
|
tools=tools if round_num == 0 else None, # 只在第一轮传递工具
|
|
|
|
|
|
tool_choice=tool_choice if round_num == 0 else None,
|
|
|
|
|
|
**kwargs
|
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
# 检查是否有工具调用
|
|
|
|
|
|
tool_calls = ai_response.get("tool_calls", [])
|
|
|
|
|
|
|
|
|
|
|
|
if not tool_calls:
|
|
|
|
|
|
# AI返回最终内容
|
|
|
|
|
|
result["content"] = ai_response.get("content", "")
|
|
|
|
|
|
result["finish_reason"] = ai_response.get("finish_reason", "stop")
|
|
|
|
|
|
break
|
|
|
|
|
|
|
|
|
|
|
|
# 3. 执行工具调用
|
|
|
|
|
|
logger.info(f"AI请求调用 {len(tool_calls)} 个工具")
|
|
|
|
|
|
|
|
|
|
|
|
try:
|
|
|
|
|
|
tool_results = await mcp_tool_service.execute_tool_calls(
|
|
|
|
|
|
user_id=user_id,
|
|
|
|
|
|
tool_calls=tool_calls,
|
|
|
|
|
|
db_session=db_session
|
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
# 记录使用的工具
|
|
|
|
|
|
for tool_call in tool_calls:
|
|
|
|
|
|
tool_name = tool_call["function"]["name"]
|
|
|
|
|
|
if tool_name not in result["tools_used"]:
|
|
|
|
|
|
result["tools_used"].append(tool_name)
|
|
|
|
|
|
|
|
|
|
|
|
result["tool_calls_made"] += len(tool_calls)
|
|
|
|
|
|
|
|
|
|
|
|
# 4. 构建工具上下文
|
|
|
|
|
|
tool_context = await mcp_tool_service.build_tool_context(
|
|
|
|
|
|
tool_results,
|
|
|
|
|
|
format="markdown"
|
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
# 5. 更新对话历史
|
|
|
|
|
|
conversation_history.append({
|
|
|
|
|
|
"role": "assistant",
|
|
|
|
|
|
"content": ai_response.get("content", ""),
|
|
|
|
|
|
"tool_calls": tool_calls
|
|
|
|
|
|
})
|
|
|
|
|
|
|
|
|
|
|
|
for tool_result in tool_results:
|
|
|
|
|
|
conversation_history.append({
|
|
|
|
|
|
"role": "tool",
|
|
|
|
|
|
"tool_call_id": tool_result["tool_call_id"],
|
|
|
|
|
|
"content": tool_result["content"]
|
|
|
|
|
|
})
|
|
|
|
|
|
|
|
|
|
|
|
# 6. 构建下一轮提示
|
|
|
|
|
|
next_prompt = (
|
|
|
|
|
|
f"{prompt}\n\n"
|
|
|
|
|
|
f"{tool_context}\n\n"
|
|
|
|
|
|
f"请基于以上工具查询结果,继续完成任务。"
|
|
|
|
|
|
)
|
|
|
|
|
|
conversation_history.append({
|
|
|
|
|
|
"role": "user",
|
|
|
|
|
|
"content": next_prompt
|
|
|
|
|
|
})
|
|
|
|
|
|
|
|
|
|
|
|
except Exception as e:
|
|
|
|
|
|
logger.error(f"执行MCP工具失败: {e}", exc_info=True)
|
|
|
|
|
|
# 降级:返回当前AI响应
|
|
|
|
|
|
result["content"] = ai_response.get("content", "")
|
|
|
|
|
|
result["finish_reason"] = "tool_error"
|
|
|
|
|
|
break
|
|
|
|
|
|
|
|
|
|
|
|
else:
|
|
|
|
|
|
# 达到最大轮次
|
2025-11-24 20:42:09 +08:00
|
|
|
|
logger.info(f"达到MCP最大调用轮次 {max_tool_rounds}")
|
2025-11-07 22:14:20 +08:00
|
|
|
|
result["content"] = conversation_history[-1].get("content", "")
|
|
|
|
|
|
result["finish_reason"] = "max_rounds"
|
|
|
|
|
|
|
|
|
|
|
|
return result
|
|
|
|
|
|
|
|
|
|
|
|
async def generate_text_stream_with_mcp(
|
|
|
|
|
|
self,
|
|
|
|
|
|
prompt: str,
|
|
|
|
|
|
user_id: str,
|
|
|
|
|
|
db_session,
|
|
|
|
|
|
enable_mcp: bool = True,
|
|
|
|
|
|
mcp_planning_prompt: Optional[str] = None,
|
|
|
|
|
|
**kwargs
|
|
|
|
|
|
) -> AsyncGenerator[str, None]:
|
|
|
|
|
|
"""
|
|
|
|
|
|
支持MCP工具的AI流式文本生成(两阶段模式)
|
|
|
|
|
|
|
|
|
|
|
|
Args:
|
|
|
|
|
|
prompt: 用户提示词
|
|
|
|
|
|
user_id: 用户ID
|
|
|
|
|
|
db_session: 数据库会话
|
|
|
|
|
|
enable_mcp: 是否启用MCP增强
|
|
|
|
|
|
mcp_planning_prompt: MCP规划阶段的提示词(可选)
|
|
|
|
|
|
**kwargs: 其他AI参数
|
|
|
|
|
|
|
|
|
|
|
|
Yields:
|
|
|
|
|
|
流式文本chunk
|
|
|
|
|
|
"""
|
|
|
|
|
|
from app.services.mcp_tool_service import mcp_tool_service
|
|
|
|
|
|
|
|
|
|
|
|
# 阶段1: 工具调用阶段(非流式)
|
|
|
|
|
|
enhanced_prompt = prompt
|
|
|
|
|
|
|
|
|
|
|
|
if enable_mcp:
|
|
|
|
|
|
try:
|
|
|
|
|
|
# 获取MCP工具
|
|
|
|
|
|
tools = await mcp_tool_service.get_user_enabled_tools(
|
|
|
|
|
|
user_id=user_id,
|
|
|
|
|
|
db_session=db_session
|
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
if tools:
|
|
|
|
|
|
logger.info(f"MCP增强(流式): 加载了 {len(tools)} 个工具")
|
|
|
|
|
|
|
|
|
|
|
|
# 使用规划提示让AI决定需要查询什么
|
|
|
|
|
|
if not mcp_planning_prompt:
|
|
|
|
|
|
mcp_planning_prompt = (
|
|
|
|
|
|
f"任务: {prompt}\n\n"
|
|
|
|
|
|
f"请分析这个任务,决定是否需要查询外部信息。"
|
|
|
|
|
|
f"如果需要,请调用相应的工具获取信息。"
|
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
# 非流式调用获取工具结果
|
|
|
|
|
|
planning_result = await self.generate_text_with_mcp(
|
|
|
|
|
|
prompt=mcp_planning_prompt,
|
|
|
|
|
|
user_id=user_id,
|
|
|
|
|
|
db_session=db_session,
|
|
|
|
|
|
enable_mcp=True,
|
|
|
|
|
|
max_tool_rounds=2,
|
|
|
|
|
|
tool_choice="auto",
|
|
|
|
|
|
**kwargs
|
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
# 如果有工具调用,将结果融入提示
|
|
|
|
|
|
if planning_result["tool_calls_made"] > 0:
|
|
|
|
|
|
enhanced_prompt = (
|
|
|
|
|
|
f"{prompt}\n\n"
|
|
|
|
|
|
f"【参考资料】\n"
|
|
|
|
|
|
f"{planning_result.get('content', '')}"
|
|
|
|
|
|
)
|
|
|
|
|
|
logger.info(
|
|
|
|
|
|
f"MCP工具规划完成,调用了 "
|
|
|
|
|
|
f"{planning_result['tool_calls_made']} 次工具"
|
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
except Exception as e:
|
|
|
|
|
|
logger.error(f"MCP工具规划失败,使用原始提示: {e}")
|
|
|
|
|
|
|
|
|
|
|
|
# 阶段2: 内容生成阶段(流式)
|
|
|
|
|
|
async for chunk in self.generate_text_stream(
|
|
|
|
|
|
prompt=enhanced_prompt,
|
|
|
|
|
|
**kwargs
|
|
|
|
|
|
):
|
|
|
|
|
|
yield chunk
|
2025-12-14 15:21:52 +08:00
|
|
|
|
|
|
|
|
|
|
# ========== JSON 统一调用和自动重试 ==========
|
|
|
|
|
|
|
|
|
|
|
|
@staticmethod
|
|
|
|
|
|
def _clean_json_response(text: str) -> str:
|
|
|
|
|
|
"""
|
|
|
|
|
|
清洗 AI 返回的 JSON 响应
|
|
|
|
|
|
|
|
|
|
|
|
去除常见的格式问题:
|
|
|
|
|
|
- markdown 代码块标记 (```json ```)
|
|
|
|
|
|
- 前后空白字符
|
|
|
|
|
|
- 注释文字
|
|
|
|
|
|
|
|
|
|
|
|
Args:
|
|
|
|
|
|
text: AI 返回的原始文本
|
|
|
|
|
|
|
|
|
|
|
|
Returns:
|
|
|
|
|
|
清洗后的 JSON 字符串
|
|
|
|
|
|
"""
|
|
|
|
|
|
if not text:
|
|
|
|
|
|
return text
|
|
|
|
|
|
|
|
|
|
|
|
# 去除 markdown 代码块标记
|
|
|
|
|
|
text = re.sub(r'^```json\s*\n?', '', text, flags=re.MULTILINE | re.IGNORECASE)
|
|
|
|
|
|
text = re.sub(r'^```\s*\n?', '', text, flags=re.MULTILINE)
|
|
|
|
|
|
text = re.sub(r'\n?```\s*$', '', text, flags=re.MULTILINE)
|
|
|
|
|
|
|
|
|
|
|
|
# 去除前后空白
|
|
|
|
|
|
text = text.strip()
|
|
|
|
|
|
|
|
|
|
|
|
# 尝试提取第一个完整的 JSON 对象或数组
|
|
|
|
|
|
# 查找第一个 { 或 [
|
|
|
|
|
|
start_idx = -1
|
|
|
|
|
|
for i, char in enumerate(text):
|
|
|
|
|
|
if char in ('{', '['):
|
|
|
|
|
|
start_idx = i
|
|
|
|
|
|
break
|
|
|
|
|
|
|
|
|
|
|
|
if start_idx == -1:
|
|
|
|
|
|
return text
|
|
|
|
|
|
|
|
|
|
|
|
# 从第一个括号开始提取
|
|
|
|
|
|
text = text[start_idx:]
|
|
|
|
|
|
|
|
|
|
|
|
# 查找匹配的结束括号
|
|
|
|
|
|
bracket_stack = []
|
|
|
|
|
|
end_idx = -1
|
|
|
|
|
|
in_string = False
|
|
|
|
|
|
escape_next = False
|
|
|
|
|
|
|
|
|
|
|
|
for i, char in enumerate(text):
|
|
|
|
|
|
if escape_next:
|
|
|
|
|
|
escape_next = False
|
|
|
|
|
|
continue
|
|
|
|
|
|
|
|
|
|
|
|
if char == '\\':
|
|
|
|
|
|
escape_next = True
|
|
|
|
|
|
continue
|
|
|
|
|
|
|
|
|
|
|
|
if char == '"':
|
|
|
|
|
|
in_string = not in_string
|
|
|
|
|
|
continue
|
|
|
|
|
|
|
|
|
|
|
|
if in_string:
|
|
|
|
|
|
continue
|
|
|
|
|
|
|
|
|
|
|
|
if char in ('{', '['):
|
|
|
|
|
|
bracket_stack.append(char)
|
|
|
|
|
|
elif char == '}':
|
|
|
|
|
|
if bracket_stack and bracket_stack[-1] == '{':
|
|
|
|
|
|
bracket_stack.pop()
|
|
|
|
|
|
if not bracket_stack:
|
|
|
|
|
|
end_idx = i + 1
|
|
|
|
|
|
break
|
|
|
|
|
|
elif char == ']':
|
|
|
|
|
|
if bracket_stack and bracket_stack[-1] == '[':
|
|
|
|
|
|
bracket_stack.pop()
|
|
|
|
|
|
if not bracket_stack:
|
|
|
|
|
|
end_idx = i + 1
|
|
|
|
|
|
break
|
|
|
|
|
|
|
|
|
|
|
|
if end_idx > 0:
|
|
|
|
|
|
return text[:end_idx]
|
|
|
|
|
|
|
|
|
|
|
|
return text
|
|
|
|
|
|
|
|
|
|
|
|
@staticmethod
|
|
|
|
|
|
def _add_json_format_hint(original_prompt: str, failed_response: str, attempt: int) -> str:
|
|
|
|
|
|
"""
|
|
|
|
|
|
重试时添加格式纠正提示
|
|
|
|
|
|
|
|
|
|
|
|
Args:
|
|
|
|
|
|
original_prompt: 原始提示词
|
|
|
|
|
|
failed_response: 上次失败的响应(截断显示)
|
|
|
|
|
|
attempt: 当前尝试次数
|
|
|
|
|
|
|
|
|
|
|
|
Returns:
|
|
|
|
|
|
增强后的提示词
|
|
|
|
|
|
"""
|
|
|
|
|
|
error_preview = failed_response[:300] if failed_response else "无响应"
|
|
|
|
|
|
|
|
|
|
|
|
return f"""{original_prompt}
|
|
|
|
|
|
|
|
|
|
|
|
⚠️ 【第 {attempt} 次重试】上一次返回格式错误,请严格遵守以下规则:
|
|
|
|
|
|
|
|
|
|
|
|
🔴 格式要求(必须严格遵守):
|
|
|
|
|
|
1. 只返回纯 JSON 对象或数组,不要有任何其他文字
|
|
|
|
|
|
2. 不要使用 ```json``` 或 ``` 包裹 JSON
|
|
|
|
|
|
3. 不要添加任何解释、说明或注释
|
|
|
|
|
|
4. 确保 JSON 格式完全正确:
|
|
|
|
|
|
- 所有括号必须匹配 {{}} []
|
|
|
|
|
|
- 所有字符串必须用双引号 ""
|
|
|
|
|
|
- 键值对用冒号分隔 :
|
|
|
|
|
|
- 多个元素用逗号分隔 ,
|
|
|
|
|
|
- 不要有多余的逗号
|
|
|
|
|
|
|
|
|
|
|
|
❌ 上一次的错误返回示例:
|
|
|
|
|
|
{error_preview}...
|
|
|
|
|
|
|
|
|
|
|
|
✅ 请现在重新生成正确的 JSON 格式内容。"""
|
|
|
|
|
|
|
|
|
|
|
|
async def call_with_json_retry(
|
|
|
|
|
|
self,
|
|
|
|
|
|
prompt: str,
|
|
|
|
|
|
system_prompt: Optional[str] = None,
|
|
|
|
|
|
max_retries: int = 3,
|
|
|
|
|
|
temperature: Optional[float] = None,
|
|
|
|
|
|
max_tokens: Optional[int] = None,
|
|
|
|
|
|
provider: Optional[str] = None,
|
|
|
|
|
|
model: Optional[str] = None,
|
|
|
|
|
|
expected_type: Optional[str] = None # "object" 或 "array"
|
|
|
|
|
|
) -> Dict[str, Any] | List[Dict[str, Any]]:
|
|
|
|
|
|
"""
|
|
|
|
|
|
统一的 JSON 调用方法,自动重试和格式修复
|
|
|
|
|
|
|
|
|
|
|
|
这是一个专门用于需要返回 JSON 格式的 AI 调用封装,会自动:
|
|
|
|
|
|
1. 清洗 AI 返回的内容(去除 markdown 标记等)
|
|
|
|
|
|
2. 解析 JSON 并验证格式
|
|
|
|
|
|
3. 失败时自动重试,并在提示词中添加纠正指引
|
|
|
|
|
|
|
|
|
|
|
|
Args:
|
|
|
|
|
|
prompt: 用户提示词
|
|
|
|
|
|
system_prompt: 系统提示词(可选)
|
|
|
|
|
|
max_retries: 最大重试次数,默认 3 次
|
|
|
|
|
|
temperature: 温度参数(可选,使用默认值)
|
|
|
|
|
|
max_tokens: 最大 token 数(可选,使用默认值)
|
|
|
|
|
|
provider: AI 提供商(可选,使用默认值)
|
|
|
|
|
|
model: 模型名称(可选,使用默认值)
|
|
|
|
|
|
expected_type: 期望的 JSON 类型 "object" 或 "array"(可选,用于额外验证)
|
|
|
|
|
|
|
|
|
|
|
|
Returns:
|
|
|
|
|
|
解析后的 JSON 对象(dict)或数组(list)
|
|
|
|
|
|
|
|
|
|
|
|
Raises:
|
|
|
|
|
|
ValueError: 重试次数用尽仍未获得有效 JSON
|
|
|
|
|
|
|
|
|
|
|
|
Examples:
|
|
|
|
|
|
>>> # 获取 JSON 对象
|
|
|
|
|
|
>>> result = await ai_service.call_with_json_retry(
|
|
|
|
|
|
... prompt="生成一个角色",
|
|
|
|
|
|
... expected_type="object"
|
|
|
|
|
|
... )
|
|
|
|
|
|
>>> print(result["name"])
|
|
|
|
|
|
|
|
|
|
|
|
>>> # 获取 JSON 数组
|
|
|
|
|
|
>>> results = await ai_service.call_with_json_retry(
|
|
|
|
|
|
... prompt="生成3个角色",
|
|
|
|
|
|
... expected_type="array"
|
|
|
|
|
|
... )
|
|
|
|
|
|
>>> print(len(results))
|
|
|
|
|
|
"""
|
|
|
|
|
|
last_error = None
|
|
|
|
|
|
last_response = ""
|
|
|
|
|
|
|
|
|
|
|
|
for attempt in range(1, max_retries + 1):
|
|
|
|
|
|
try:
|
|
|
|
|
|
logger.info(f"🔄 JSON 调用尝试 {attempt}/{max_retries}")
|
|
|
|
|
|
|
|
|
|
|
|
# 第一次使用原始提示词,之后使用增强提示词
|
|
|
|
|
|
current_prompt = prompt if attempt == 1 else self._add_json_format_hint(
|
|
|
|
|
|
prompt, last_response, attempt
|
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
# 调用 AI 生成内容
|
|
|
|
|
|
if provider == "openai" and self.openai_client:
|
|
|
|
|
|
response = await self._generate_openai(
|
|
|
|
|
|
prompt=current_prompt,
|
|
|
|
|
|
model=model or self.default_model,
|
|
|
|
|
|
temperature=temperature or self.default_temperature,
|
|
|
|
|
|
max_tokens=max_tokens or self.default_max_tokens,
|
|
|
|
|
|
system_prompt=system_prompt
|
|
|
|
|
|
)
|
|
|
|
|
|
elif provider == "anthropic" and self.anthropic_client:
|
|
|
|
|
|
response = await self._generate_anthropic(
|
|
|
|
|
|
prompt=current_prompt,
|
|
|
|
|
|
model=model or self.default_model,
|
|
|
|
|
|
temperature=temperature or self.default_temperature,
|
|
|
|
|
|
max_tokens=max_tokens or self.default_max_tokens,
|
|
|
|
|
|
system_prompt=system_prompt
|
|
|
|
|
|
)
|
|
|
|
|
|
else:
|
|
|
|
|
|
# 使用默认提供商
|
|
|
|
|
|
if self.api_provider == "openai":
|
|
|
|
|
|
response = await self._generate_openai(
|
|
|
|
|
|
prompt=current_prompt,
|
|
|
|
|
|
model=model or self.default_model,
|
|
|
|
|
|
temperature=temperature or self.default_temperature,
|
|
|
|
|
|
max_tokens=max_tokens or self.default_max_tokens,
|
|
|
|
|
|
system_prompt=system_prompt
|
|
|
|
|
|
)
|
|
|
|
|
|
else:
|
|
|
|
|
|
response = await self._generate_anthropic(
|
|
|
|
|
|
prompt=current_prompt,
|
|
|
|
|
|
model=model or self.default_model,
|
|
|
|
|
|
temperature=temperature or self.default_temperature,
|
|
|
|
|
|
max_tokens=max_tokens or self.default_max_tokens,
|
|
|
|
|
|
system_prompt=system_prompt
|
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
last_response = response
|
|
|
|
|
|
|
|
|
|
|
|
# 清洗响应内容
|
|
|
|
|
|
cleaned = self._clean_json_response(response)
|
|
|
|
|
|
logger.debug(f"清洗后的内容: {cleaned[:200]}...")
|
|
|
|
|
|
|
|
|
|
|
|
# 解析 JSON
|
|
|
|
|
|
try:
|
|
|
|
|
|
data = json.loads(cleaned)
|
|
|
|
|
|
except json.JSONDecodeError as e:
|
|
|
|
|
|
logger.warning(f"⚠️ JSON 解析失败: {e}")
|
|
|
|
|
|
logger.debug(f"原始响应: {response[:500]}")
|
|
|
|
|
|
logger.debug(f"清洗后: {cleaned[:500]}")
|
|
|
|
|
|
raise
|
|
|
|
|
|
|
|
|
|
|
|
# 可选:验证 JSON 类型
|
|
|
|
|
|
if expected_type:
|
|
|
|
|
|
if expected_type == "object" and not isinstance(data, dict):
|
|
|
|
|
|
raise ValueError(f"期望 JSON 对象,但得到 {type(data).__name__}")
|
|
|
|
|
|
elif expected_type == "array" and not isinstance(data, list):
|
|
|
|
|
|
raise ValueError(f"期望 JSON 数组,但得到 {type(data).__name__}")
|
|
|
|
|
|
|
|
|
|
|
|
logger.info(f"✅ JSON 解析成功 (尝试 {attempt}/{max_retries})")
|
|
|
|
|
|
if isinstance(data, dict):
|
|
|
|
|
|
logger.info(f" 返回对象,包含 {len(data)} 个键")
|
|
|
|
|
|
elif isinstance(data, list):
|
|
|
|
|
|
logger.info(f" 返回数组,包含 {len(data)} 个元素")
|
|
|
|
|
|
|
|
|
|
|
|
return data
|
|
|
|
|
|
|
|
|
|
|
|
except json.JSONDecodeError as e:
|
|
|
|
|
|
last_error = e
|
|
|
|
|
|
logger.warning(f"⚠️ 第 {attempt} 次尝试失败: JSON 解析错误")
|
|
|
|
|
|
logger.warning(f" 错误位置: {e.msg} at line {e.lineno} column {e.colno}")
|
|
|
|
|
|
|
|
|
|
|
|
if attempt < max_retries:
|
|
|
|
|
|
logger.info(f" 准备第 {attempt + 1} 次重试...")
|
|
|
|
|
|
continue
|
|
|
|
|
|
else:
|
|
|
|
|
|
logger.error(f"❌ JSON 解析失败,已达到最大重试次数 {max_retries}")
|
|
|
|
|
|
logger.error(f" 最后的响应内容:\n{last_response[:1000]}")
|
|
|
|
|
|
raise ValueError(
|
|
|
|
|
|
f"AI 返回内容无法解析为 JSON,已重试 {max_retries} 次。\n"
|
|
|
|
|
|
f"最后错误: {e}\n"
|
|
|
|
|
|
f"响应预览: {last_response[:200]}..."
|
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
except ValueError as e:
|
|
|
|
|
|
last_error = e
|
|
|
|
|
|
logger.warning(f"⚠️ 第 {attempt} 次尝试失败: {e}")
|
|
|
|
|
|
|
|
|
|
|
|
if attempt < max_retries:
|
|
|
|
|
|
logger.info(f" 准备第 {attempt + 1} 次重试...")
|
|
|
|
|
|
continue
|
|
|
|
|
|
else:
|
|
|
|
|
|
logger.error(f"❌ 验证失败,已达到最大重试次数 {max_retries}")
|
|
|
|
|
|
raise ValueError(
|
|
|
|
|
|
f"AI 返回的 JSON 格式不符合要求,已重试 {max_retries} 次。\n"
|
|
|
|
|
|
f"错误: {e}"
|
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
except Exception as e:
|
|
|
|
|
|
logger.error(f"❌ 第 {attempt} 次调用出现未预期错误: {type(e).__name__}: {e}")
|
|
|
|
|
|
if attempt < max_retries:
|
|
|
|
|
|
logger.info(f" 准备第 {attempt + 1} 次重试...")
|
|
|
|
|
|
last_error = e
|
|
|
|
|
|
continue
|
|
|
|
|
|
else:
|
|
|
|
|
|
raise
|
|
|
|
|
|
|
|
|
|
|
|
# 理论上不会到达这里,但以防万一
|
|
|
|
|
|
raise ValueError(f"JSON 调用失败,已重试 {max_retries} 次。最后错误: {last_error}")
|
2025-10-30 11:14:43 +08:00
|
|
|
|
|
|
|
|
|
|
|
2025-11-03 15:28:51 +08:00
|
|
|
|
# 创建全局AI服务实例
|
2025-10-30 16:53:50 +08:00
|
|
|
|
ai_service = AIService()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def create_user_ai_service(
|
|
|
|
|
|
api_provider: str,
|
|
|
|
|
|
api_key: str,
|
|
|
|
|
|
api_base_url: str,
|
|
|
|
|
|
model_name: str,
|
|
|
|
|
|
temperature: float,
|
|
|
|
|
|
max_tokens: int
|
|
|
|
|
|
) -> AIService:
|
|
|
|
|
|
"""
|
|
|
|
|
|
根据用户设置创建AI服务实例
|
|
|
|
|
|
|
|
|
|
|
|
Args:
|
|
|
|
|
|
api_provider: API提供商
|
|
|
|
|
|
api_key: API密钥
|
|
|
|
|
|
api_base_url: API基础URL
|
|
|
|
|
|
model_name: 模型名称
|
|
|
|
|
|
temperature: 温度参数
|
|
|
|
|
|
max_tokens: 最大tokens
|
|
|
|
|
|
|
|
|
|
|
|
Returns:
|
|
|
|
|
|
AIService实例
|
|
|
|
|
|
"""
|
|
|
|
|
|
return AIService(
|
|
|
|
|
|
api_provider=api_provider,
|
|
|
|
|
|
api_key=api_key,
|
|
|
|
|
|
api_base_url=api_base_url,
|
|
|
|
|
|
default_model=model_name,
|
|
|
|
|
|
default_temperature=temperature,
|
|
|
|
|
|
default_max_tokens=max_tokens
|
|
|
|
|
|
)
|