update:1.新增统一的JSON清洗和重试方法，避免AI响应json格式错误 2.重构提示词模板命名，优化大纲章节初始化提示词 3.移除布冯冗余代码，提高代码复用性 4.优化系统默认写作风格预设提示词和规则

2025-12-14 15:21:52 +08:00
parent 86b73e85fb
commit 24b0a09b43
11 changed files with 633 additions and 1851 deletions
@@ -8,9 +8,15 @@ from app.mcp.adapters import UniversalMCPAdapter, PromptInjectionAdapter
 import httpx
 import json
 import hashlib
+import re
+import asyncio

 logger = get_logger(__name__)

+# 全局请求限流器（使用信号量控制并发数）
+_global_semaphore = asyncio.Semaphore(5)  # 最多5个并发请求
+_request_delay = 0.2  # 请求间隔200ms
+
 # 全局HTTP客户端池（按配置复用）
 _http_client_pool: Dict[str, httpx.AsyncClient] = {}
 _client_pool_lock = False  # 简单的锁标志
@@ -308,7 +314,7 @@ class AIService:
        max_tokens: int,
        system_prompt: Optional[str]
    ) -> str:
-        """使用OpenAI生成文本"""
+        """使用OpenAI生成文本（带限流和重试）"""
        if not self.openai_http_client:
            raise ValueError("OpenAI客户端未初始化，请检查API key配置")
        
@@ -317,84 +323,118 @@ class AIService:
            messages.append({"role": "system", "content": system_prompt})
        messages.append({"role": "user", "content": prompt})
        
-        try:
-            logger.info(f"🔵 开始调用OpenAI API（直接HTTP请求）")
-            logger.info(f"  - 模型: {model}")
-            logger.info(f"  - 温度: {temperature}")
-            logger.info(f"  - 最大tokens: {max_tokens}")
-            logger.info(f"  - Prompt长度: {len(prompt)} 字符")
-            logger.info(f"  - 消息数量: {len(messages)}")
+        # 使用全局信号量限流
+        async with _global_semaphore:
+            # 请求间隔
+            await asyncio.sleep(_request_delay)
            
-            url = f"{self.openai_base_url}/chat/completions"
-            headers = {
-                "Authorization": f"Bearer {self.openai_api_key}",
-                "Content-Type": "application/json"
-            }
-            payload = {
-                "model": model,
-                "messages": messages,
-                "temperature": temperature,
-                "max_tokens": max_tokens
-            }
-            
-            logger.debug(f"  - 请求URL: {url}")
-            logger.debug(f"  - 请求头: Authorization=Bearer ***")
-            
-            response = await self.openai_http_client.post(url, headers=headers, json=payload)
-            response.raise_for_status()
-            
-            data = response.json()
-            
-            logger.info(f"✅ OpenAI API调用成功")
-            logger.info(f"  - 响应ID: {data.get('id', 'N/A')}")
-            logger.info(f"  - 选项数量: {len(data.get('choices', []))}")
-            logger.debug(f"  - 完整API响应: {data}")
-            
-            if not data.get('choices'):
-                logger.error("❌ OpenAI返回的choices为空")
-                raise ValueError("API返回的响应格式错误：choices字段为空")
-            
-            choice = data['choices'][0]
-            message = choice.get('message', {})
-            finish_reason = choice.get('finish_reason')
-            
-            # DeepSeek R1特殊处理：只使用content（最终答案），忽略reasoning_content（思考过程）
-            # reasoning_content是AI的思考过程，不是我们需要的JSON结果
-            content = message.get('content', '')
-            
-            # 检查是否因达到长度限制而截断
-            if finish_reason == 'length':
-                logger.warning(f"⚠️  响应因达到max_tokens限制而被截断")
-                logger.warning(f"  - 当前max_tokens: {max_tokens}")
-                logger.warning(f"  - 建议: 增加max_tokens参数（推荐2000+）")
-            
-            if content:
-                logger.info(f"  - 返回内容长度: {len(content)} 字符")
-                logger.info(f"  - 完成原因: {finish_reason}")
-                logger.info(f"  - 返回内容预览（前200字符）: {content[:200]}")
-                return content
-            else:
-                logger.error("❌ AI返回了空内容")
-                logger.error(f"  - 完整响应: {data}")
-                logger.error(f"  - 完成原因: {finish_reason}")
+            # 重试机制
+            max_retries = 3
+            for attempt in range(max_retries):
+                try:
+                    if attempt > 0:
+                        wait_time = min(2 ** attempt, 10)  # 指数退避
+                        logger.warning(f"⚠️ OpenAI API调用失败，{wait_time}秒后重试（第{attempt + 1}/{max_retries}次）")
+                        await asyncio.sleep(wait_time)
+                    
+                    logger.info(f"🔵 开始调用OpenAI API（尝试 {attempt + 1}/{max_retries}）")
+                    logger.info(f"  - 模型: {model}")
+                    logger.info(f"  - 温度: {temperature}")
+                    logger.info(f"  - 最大tokens: {max_tokens}")
+                    logger.info(f"  - Prompt长度: {len(prompt)} 字符")
+                    logger.info(f"  - 消息数量: {len(messages)}")
+                    
+                    url = f"{self.openai_base_url}/chat/completions"
+                    headers = {
+                        "Authorization": f"Bearer {self.openai_api_key}",
+                        "Content-Type": "application/json"
+                    }
+                    payload = {
+                        "model": model,
+                        "messages": messages,
+                        "temperature": temperature,
+                        "max_tokens": max_tokens
+                    }
+                    
+                    logger.debug(f"  - 请求URL: {url}")
+                    logger.debug(f"  - 请求头: Authorization=Bearer ***")
+                    
+                    response = await self.openai_http_client.post(url, headers=headers, json=payload)
+                    response.raise_for_status()
+                    
+                    data = response.json()
+                    
+                    logger.info(f"✅ OpenAI API调用成功")
+                    logger.info(f"  - 响应ID: {data.get('id', 'N/A')}")
+                    logger.info(f"  - 选项数量: {len(data.get('choices', []))}")
+                    logger.debug(f"  - 完整API响应: {data}")
+                    
+                    if not data.get('choices'):
+                        logger.error("❌ OpenAI返回的choices为空")
+                        raise ValueError("API返回的响应格式错误：choices字段为空")
+                    
+                    choice = data['choices'][0]
+                    message = choice.get('message', {})
+                    finish_reason = choice.get('finish_reason')
+                    
+                    # DeepSeek R1特殊处理：只使用content（最终答案），忽略reasoning_content（思考过程）
+                    # reasoning_content是AI的思考过程，不是我们需要的JSON结果
+                    content = message.get('content', '')
+                    
+                    # 检查是否因达到长度限制而截断
+                    if finish_reason == 'length':
+                        logger.warning(f"⚠️  响应因达到max_tokens限制而被截断")
+                        logger.warning(f"  - 当前max_tokens: {max_tokens}")
+                        logger.warning(f"  - 建议: 增加max_tokens参数（推荐2000+）")
+                    
+                    if content:
+                        logger.info(f"  - 返回内容长度: {len(content)} 字符")
+                        logger.info(f"  - 完成原因: {finish_reason}")
+                        logger.info(f"  - 返回内容预览（前200字符）: {content[:200]}")
+                        return content
+                    else:
+                        logger.error("❌ AI返回了空内容")
+                        logger.error(f"  - 完整响应: {data}")
+                        logger.error(f"  - 完成原因: {finish_reason}")
+                        
+                        # 提供更详细的错误信息
+                        if finish_reason == 'length':
+                            raise ValueError(f"AI响应被截断且无有效内容。请增加max_tokens参数（当前: {max_tokens}，建议: 2000+）")
+                        else:
+                            raise ValueError(f"AI返回了空内容（finish_reason: {finish_reason}），请检查API配置或稍后重试")
                
-                # 提供更详细的错误信息
-                if finish_reason == 'length':
-                    raise ValueError(f"AI响应被截断且无有效内容。请增加max_tokens参数（当前: {max_tokens}，建议: 2000+）")
-                else:
-                    raise ValueError(f"AI返回了空内容（finish_reason: {finish_reason}），请检查API配置或稍后重试")
-            
-        except httpx.HTTPStatusError as e:
-            logger.error(f"❌ OpenAI API调用失败 (HTTP {e.response.status_code})")
-            logger.error(f"  - 错误信息: {e.response.text}")
-            logger.error(f"  - 模型: {model}")
-            raise Exception(f"API返回错误 ({e.response.status_code}): {e.response.text}")
-        except Exception as e:
-            logger.error(f"❌ OpenAI API调用失败")
-            logger.error(f"  - 错误类型: {type(e).__name__}")
-            logger.error(f"  - 错误信息: {str(e)}")
-            logger.error(f"  - 模型: {model}")
-            raise
+                except httpx.ConnectError as e:
+                    logger.error(f"❌ OpenAI API连接失败 (尝试 {attempt + 1}/{max_retries}): {str(e)}")
+                    if attempt == max_retries - 1:
+                        raise Exception(f"连接失败，已重试{max_retries}次。请检查网络连接或API地址: {str(e)}")
+                    continue
+                    
+                except httpx.HTTPStatusError as e:
+                    logger.error(f"❌ OpenAI API调用失败 (HTTP {e.response.status_code}, 尝试 {attempt + 1}/{max_retries})")
+                    logger.error(f"  - 错误信息: {e.response.text}")
+                    
+                    # 某些错误不需要重试（如401、403）
+                    if e.response.status_code in [401, 403, 404]:
+                        raise Exception(f"API返回错误 ({e.response.status_code}): {e.response.text}")
+                    
+                    if attempt == max_retries - 1:
+                        raise Exception(f"API返回错误 ({e.response.status_code}): {e.response.text}")
+                    continue
+                    
+                except httpx.TimeoutException as e:
+                    logger.error(f"❌ OpenAI API超时 (尝试 {attempt + 1}/{max_retries})")
+                    if attempt == max_retries - 1:
+                        raise Exception(f"API请求超时，已重试{max_retries}次: {str(e)}")
+                    continue
+                    
+                except Exception as e:
+                    logger.error(f"❌ OpenAI API调用失败 (尝试 {attempt + 1}/{max_retries})")
+                    logger.error(f"  - 错误类型: {type(e).__name__}")
+                    logger.error(f"  - 错误信息: {str(e)}")
+                    
+                    if attempt == max_retries - 1:
+                        raise
+                    continue
    

    async def _generate_openai_with_tools(
@@ -1044,6 +1084,297 @@ class AIService:
            **kwargs
        ):
            yield chunk
+    
+    # ========== JSON 统一调用和自动重试 ==========
+    
+    @staticmethod
+    def _clean_json_response(text: str) -> str:
+        """
+        清洗 AI 返回的 JSON 响应
+        
+        去除常见的格式问题：
+        - markdown 代码块标记 (```json ```)
+        - 前后空白字符
+        - 注释文字
+        
+        Args:
+            text: AI 返回的原始文本
+            
+        Returns:
+            清洗后的 JSON 字符串
+        """
+        if not text:
+            return text
+        
+        # 去除 markdown 代码块标记
+        text = re.sub(r'^```json\s*\n?', '', text, flags=re.MULTILINE | re.IGNORECASE)
+        text = re.sub(r'^```\s*\n?', '', text, flags=re.MULTILINE)
+        text = re.sub(r'\n?```\s*$', '', text, flags=re.MULTILINE)
+        
+        # 去除前后空白
+        text = text.strip()
+        
+        # 尝试提取第一个完整的 JSON 对象或数组
+        # 查找第一个 { 或 [
+        start_idx = -1
+        for i, char in enumerate(text):
+            if char in ('{', '['):
+                start_idx = i
+                break
+        
+        if start_idx == -1:
+            return text
+        
+        # 从第一个括号开始提取
+        text = text[start_idx:]
+        
+        # 查找匹配的结束括号
+        bracket_stack = []
+        end_idx = -1
+        in_string = False
+        escape_next = False
+        
+        for i, char in enumerate(text):
+            if escape_next:
+                escape_next = False
+                continue
+            
+            if char == '\\':
+                escape_next = True
+                continue
+            
+            if char == '"':
+                in_string = not in_string
+                continue
+            
+            if in_string:
+                continue
+            
+            if char in ('{', '['):
+                bracket_stack.append(char)
+            elif char == '}':
+                if bracket_stack and bracket_stack[-1] == '{':
+                    bracket_stack.pop()
+                    if not bracket_stack:
+                        end_idx = i + 1
+                        break
+            elif char == ']':
+                if bracket_stack and bracket_stack[-1] == '[':
+                    bracket_stack.pop()
+                    if not bracket_stack:
+                        end_idx = i + 1
+                        break
+        
+        if end_idx > 0:
+            return text[:end_idx]
+        
+        return text
+    
+    @staticmethod
+    def _add_json_format_hint(original_prompt: str, failed_response: str, attempt: int) -> str:
+        """
+        重试时添加格式纠正提示
+        
+        Args:
+            original_prompt: 原始提示词
+            failed_response: 上次失败的响应（截断显示）
+            attempt: 当前尝试次数
+            
+        Returns:
+            增强后的提示词
+        """
+        error_preview = failed_response[:300] if failed_response else "无响应"
+        
+        return f"""{original_prompt}
+
+⚠️ 【第 {attempt} 次重试】上一次返回格式错误，请严格遵守以下规则：
+
+🔴 格式要求（必须严格遵守）：
+1. 只返回纯 JSON 对象或数组，不要有任何其他文字
+2. 不要使用 ```json``` 或 ``` 包裹 JSON
+3. 不要添加任何解释、说明或注释
+4. 确保 JSON 格式完全正确：
+   - 所有括号必须匹配 {{}} []
+   - 所有字符串必须用双引号 ""
+   - 键值对用冒号分隔 :
+   - 多个元素用逗号分隔 ,
+   - 不要有多余的逗号
+
+❌ 上一次的错误返回示例：
+{error_preview}...
+
+✅ 请现在重新生成正确的 JSON 格式内容。"""
+    
+    async def call_with_json_retry(
+        self,
+        prompt: str,
+        system_prompt: Optional[str] = None,
+        max_retries: int = 3,
+        temperature: Optional[float] = None,
+        max_tokens: Optional[int] = None,
+        provider: Optional[str] = None,
+        model: Optional[str] = None,
+        expected_type: Optional[str] = None  # "object" 或 "array"
+    ) -> Dict[str, Any] | List[Dict[str, Any]]:
+        """
+        统一的 JSON 调用方法，自动重试和格式修复
+        
+        这是一个专门用于需要返回 JSON 格式的 AI 调用封装，会自动：
+        1. 清洗 AI 返回的内容（去除 markdown 标记等）
+        2. 解析 JSON 并验证格式
+        3. 失败时自动重试，并在提示词中添加纠正指引
+        
+        Args:
+            prompt: 用户提示词
+            system_prompt: 系统提示词（可选）
+            max_retries: 最大重试次数，默认 3 次
+            temperature: 温度参数（可选，使用默认值）
+            max_tokens: 最大 token 数（可选，使用默认值）
+            provider: AI 提供商（可选，使用默认值）
+            model: 模型名称（可选，使用默认值）
+            expected_type: 期望的 JSON 类型 "object" 或 "array"（可选，用于额外验证）
+            
+        Returns:
+            解析后的 JSON 对象（dict）或数组（list）
+            
+        Raises:
+            ValueError: 重试次数用尽仍未获得有效 JSON
+            
+        Examples:
+            >>> # 获取 JSON 对象
+            >>> result = await ai_service.call_with_json_retry(
+            ...     prompt="生成一个角色",
+            ...     expected_type="object"
+            ... )
+            >>> print(result["name"])
+            
+            >>> # 获取 JSON 数组
+            >>> results = await ai_service.call_with_json_retry(
+            ...     prompt="生成3个角色",
+            ...     expected_type="array"
+            ... )
+            >>> print(len(results))
+        """
+        last_error = None
+        last_response = ""
+        
+        for attempt in range(1, max_retries + 1):
+            try:
+                logger.info(f"🔄 JSON 调用尝试 {attempt}/{max_retries}")
+                
+                # 第一次使用原始提示词，之后使用增强提示词
+                current_prompt = prompt if attempt == 1 else self._add_json_format_hint(
+                    prompt, last_response, attempt
+                )
+                
+                # 调用 AI 生成内容
+                if provider == "openai" and self.openai_client:
+                    response = await self._generate_openai(
+                        prompt=current_prompt,
+                        model=model or self.default_model,
+                        temperature=temperature or self.default_temperature,
+                        max_tokens=max_tokens or self.default_max_tokens,
+                        system_prompt=system_prompt
+                    )
+                elif provider == "anthropic" and self.anthropic_client:
+                    response = await self._generate_anthropic(
+                        prompt=current_prompt,
+                        model=model or self.default_model,
+                        temperature=temperature or self.default_temperature,
+                        max_tokens=max_tokens or self.default_max_tokens,
+                        system_prompt=system_prompt
+                    )
+                else:
+                    # 使用默认提供商
+                    if self.api_provider == "openai":
+                        response = await self._generate_openai(
+                            prompt=current_prompt,
+                            model=model or self.default_model,
+                            temperature=temperature or self.default_temperature,
+                            max_tokens=max_tokens or self.default_max_tokens,
+                            system_prompt=system_prompt
+                        )
+                    else:
+                        response = await self._generate_anthropic(
+                            prompt=current_prompt,
+                            model=model or self.default_model,
+                            temperature=temperature or self.default_temperature,
+                            max_tokens=max_tokens or self.default_max_tokens,
+                            system_prompt=system_prompt
+                        )
+                
+                last_response = response
+                
+                # 清洗响应内容
+                cleaned = self._clean_json_response(response)
+                logger.debug(f"清洗后的内容: {cleaned[:200]}...")
+                
+                # 解析 JSON
+                try:
+                    data = json.loads(cleaned)
+                except json.JSONDecodeError as e:
+                    logger.warning(f"⚠️ JSON 解析失败: {e}")
+                    logger.debug(f"原始响应: {response[:500]}")
+                    logger.debug(f"清洗后: {cleaned[:500]}")
+                    raise
+                
+                # 可选：验证 JSON 类型
+                if expected_type:
+                    if expected_type == "object" and not isinstance(data, dict):
+                        raise ValueError(f"期望 JSON 对象，但得到 {type(data).__name__}")
+                    elif expected_type == "array" and not isinstance(data, list):
+                        raise ValueError(f"期望 JSON 数组，但得到 {type(data).__name__}")
+                
+                logger.info(f"✅ JSON 解析成功 (尝试 {attempt}/{max_retries})")
+                if isinstance(data, dict):
+                    logger.info(f"   返回对象，包含 {len(data)} 个键")
+                elif isinstance(data, list):
+                    logger.info(f"   返回数组，包含 {len(data)} 个元素")
+                
+                return data
+                
+            except json.JSONDecodeError as e:
+                last_error = e
+                logger.warning(f"⚠️ 第 {attempt} 次尝试失败: JSON 解析错误")
+                logger.warning(f"   错误位置: {e.msg} at line {e.lineno} column {e.colno}")
+                
+                if attempt < max_retries:
+                    logger.info(f"   准备第 {attempt + 1} 次重试...")
+                    continue
+                else:
+                    logger.error(f"❌ JSON 解析失败，已达到最大重试次数 {max_retries}")
+                    logger.error(f"   最后的响应内容:\n{last_response[:1000]}")
+                    raise ValueError(
+                        f"AI 返回内容无法解析为 JSON，已重试 {max_retries} 次。\n"
+                        f"最后错误: {e}\n"
+                        f"响应预览: {last_response[:200]}..."
+                    )
+            
+            except ValueError as e:
+                last_error = e
+                logger.warning(f"⚠️ 第 {attempt} 次尝试失败: {e}")
+                
+                if attempt < max_retries:
+                    logger.info(f"   准备第 {attempt + 1} 次重试...")
+                    continue
+                else:
+                    logger.error(f"❌ 验证失败，已达到最大重试次数 {max_retries}")
+                    raise ValueError(
+                        f"AI 返回的 JSON 格式不符合要求，已重试 {max_retries} 次。\n"
+                        f"错误: {e}"
+                    )
+            
+            except Exception as e:
+                logger.error(f"❌ 第 {attempt} 次调用出现未预期错误: {type(e).__name__}: {e}")
+                if attempt < max_retries:
+                    logger.info(f"   准备第 {attempt + 1} 次重试...")
+                    last_error = e
+                    continue
+                else:
+                    raise
+        
+        # 理论上不会到达这里，但以防万一
+        raise ValueError(f"JSON 调用失败，已重试 {max_retries} 次。最后错误: {last_error}")


 # 创建全局AI服务实例