"""剧情分析服务 - 自动分析章节的钩子、伏笔、冲突等元素""" from typing import Dict, Any, List, Optional from sqlalchemy.ext.asyncio import AsyncSession from app.services.ai_service import AIService from app.services.prompt_service import prompt_service, PromptService from app.logger import get_logger import json import re logger = get_logger(__name__) class PlotAnalyzer: """剧情分析器 - 使用AI分析章节内容""" def __init__(self, ai_service: AIService): """ 初始化剧情分析器 Args: ai_service: AI服务实例 """ self.ai_service = ai_service logger.info("✅ PlotAnalyzer初始化成功") async def analyze_chapter( self, chapter_number: int, title: str, content: str, word_count: int, user_id: str = None, db: AsyncSession = None ) -> Optional[Dict[str, Any]]: """ 分析单章内容 Args: chapter_number: 章节号 title: 章节标题 content: 章节内容 word_count: 字数 user_id: 用户ID(用于获取自定义提示词) db: 数据库会话(用于查询自定义提示词) Returns: 分析结果字典,失败返回None """ try: logger.info(f"🔍 开始分析第{chapter_number}章: {title}") # 如果内容过长,截取前8000字(避免超token) analysis_content = content[:8000] if len(content) > 8000 else content # 获取自定义提示词模板 if user_id and db: template = await PromptService.get_template("PLOT_ANALYSIS", user_id, db) else: # 降级到系统默认模板 template = PromptService.PLOT_ANALYSIS # 格式化提示词 prompt = PromptService.format_prompt( template, chapter_number=chapter_number, title=title, word_count=word_count, content=analysis_content ) # 调用AI进行分析 # 注意:不指定max_tokens,使用用户在设置中配置的值 logger.info(f" 调用AI分析(内容长度: {len(analysis_content)}字)...") response = await self.ai_service.generate_text( prompt=prompt, temperature=0.3 # 降低温度以获得更稳定的JSON输出 ) # 🔍 添加调试日志:查看AI返回的原始内容 # logger.info(f"🔍 AI返回类型: {type(response)}") # logger.info(f"🔍 AI返回内容(前500字符): {str(response)}") # 从返回的字典中提取content字段 if isinstance(response, dict): response_text = response.get('content', '') if not response_text: logger.error("❌ AI返回的字典中没有content字段或content为空") return None else: # 兼容旧的字符串返回格式 response_text = response # 解析JSON结果 analysis_result = self._parse_analysis_response(response_text) if analysis_result: logger.info(f"✅ 第{chapter_number}章分析完成") logger.info(f" - 钩子: {len(analysis_result.get('hooks', []))}个") logger.info(f" - 伏笔: {len(analysis_result.get('foreshadows', []))}个") logger.info(f" - 情节点: {len(analysis_result.get('plot_points', []))}个") logger.info(f" - 整体评分: {analysis_result.get('scores', {}).get('overall', 'N/A')}") return analysis_result else: logger.error(f"❌ 第{chapter_number}章分析失败: JSON解析错误") return None except Exception as e: logger.error(f"❌ 章节分析异常: {str(e)}") return None def _parse_analysis_response(self, response: str) -> Optional[Dict[str, Any]]: """ 解析AI返回的分析结果(使用统一的JSON清洗方法) Args: response: AI返回的文本 Returns: 解析后的字典,失败返回None """ try: # 使用统一的JSON清洗方法 cleaned = self.ai_service._clean_json_response(response) # 尝试解析JSON result = json.loads(cleaned) # 验证必要字段 required_fields = ['hooks', 'plot_points', 'scores'] for field in required_fields: if field not in result: logger.warning(f"⚠️ 分析结果缺少字段: {field}") result[field] = [] if field != 'scores' else {} logger.info("✅ 成功解析分析结果") return result except json.JSONDecodeError as e: logger.error(f"❌ JSON解析失败: {str(e)}") logger.error(f" 原始响应(前500字): {response[:500]}") return None except Exception as e: logger.error(f"❌ 解析异常: {str(e)}") return None def extract_memories_from_analysis( self, analysis: Dict[str, Any], chapter_id: str, chapter_number: int, chapter_content: str = "", chapter_title: str = "" ) -> List[Dict[str, Any]]: """ 从分析结果中提取记忆片段 Args: analysis: 分析结果 chapter_id: 章节ID chapter_number: 章节号 chapter_content: 章节完整内容(用于计算位置) chapter_title: 章节标题 Returns: 记忆片段列表 """ memories = [] try: # 【新增】0. 提取章节摘要作为记忆(用于语义检索相关章节) chapter_summary = "" # 尝试从分析结果获取摘要 if analysis.get('summary'): chapter_summary = analysis.get('summary') # 或者从情节点组合生成摘要 elif analysis.get('plot_points'): plot_summaries = [p.get('content', '') for p in analysis.get('plot_points', [])[:3]] chapter_summary = ";".join(plot_summaries) # 或者使用内容前300字 elif chapter_content: chapter_summary = chapter_content[:300] + ("..." if len(chapter_content) > 300 else "") # 如果有摘要,添加到记忆中 if chapter_summary: memories.append({ 'type': 'chapter_summary', 'content': chapter_summary, 'title': f"第{chapter_number}章《{chapter_title}》摘要", 'metadata': { 'chapter_id': chapter_id, 'chapter_number': chapter_number, 'importance_score': 0.6, # 中等重要性 'tags': ['摘要', '章节概览', chapter_title], 'is_foreshadow': 0, 'text_position': 0, 'text_length': len(chapter_summary) } }) logger.info(f" ✅ 添加章节摘要记忆: {len(chapter_summary)}字") # 1. 提取钩子作为记忆 for i, hook in enumerate(analysis.get('hooks', [])): if hook.get('strength', 0) >= 6: # 只保存强度>=6的钩子 keyword = hook.get('keyword', '') position, length = self._find_text_position(chapter_content, keyword) logger.info(f" 钩子位置: keyword='{keyword[:30]}...', pos={position}, len={length}") memories.append({ 'type': 'hook', 'content': f"[{hook.get('type', '未知')}钩子] {hook.get('content', '')}", 'title': f"{hook.get('type', '钩子')} - {hook.get('position', '')}", 'metadata': { 'chapter_id': chapter_id, 'chapter_number': chapter_number, 'importance_score': min(hook.get('strength', 5) / 10, 1.0), 'tags': [hook.get('type', '钩子'), hook.get('position', '')], 'is_foreshadow': 0, 'keyword': keyword, 'text_position': position, 'text_length': length, 'strength': hook.get('strength', 5), 'position_desc': hook.get('position', '') } }) # 2. 提取伏笔作为记忆 for i, foreshadow in enumerate(analysis.get('foreshadows', [])): is_planted = foreshadow.get('type') == 'planted' keyword = foreshadow.get('keyword', '') position, length = self._find_text_position(chapter_content, keyword) logger.info(f" 伏笔位置: keyword='{keyword[:30]}...', pos={position}, len={length}") memories.append({ 'type': 'foreshadow', 'content': foreshadow.get('content', ''), 'title': f"{'埋下伏笔' if is_planted else '回收伏笔'}", 'metadata': { 'chapter_id': chapter_id, 'chapter_number': chapter_number, 'importance_score': min(foreshadow.get('strength', 5) / 10, 1.0), 'tags': ['伏笔', foreshadow.get('type', 'planted')], 'is_foreshadow': 1 if is_planted else 2, 'reference_chapter': foreshadow.get('reference_chapter'), 'keyword': keyword, 'text_position': position, 'text_length': length, 'foreshadow_type': foreshadow.get('type', 'planted'), 'strength': foreshadow.get('strength', 5) } }) # 3. 提取关键情节点 for i, plot_point in enumerate(analysis.get('plot_points', [])): if plot_point.get('importance', 0) >= 0.6: # 只保存重要性>=0.6的情节点 keyword = plot_point.get('keyword', '') position, length = self._find_text_position(chapter_content, keyword) logger.info(f" 情节点位置: keyword='{keyword[:30]}...', pos={position}, len={length}") memories.append({ 'type': 'plot_point', 'content': f"{plot_point.get('content', '')}。影响: {plot_point.get('impact', '')}", 'title': f"情节点 - {plot_point.get('type', '未知')}", 'metadata': { 'chapter_id': chapter_id, 'chapter_number': chapter_number, 'importance_score': plot_point.get('importance', 0.5), 'tags': ['情节点', plot_point.get('type', '未知')], 'is_foreshadow': 0, 'keyword': keyword, 'text_position': position, 'text_length': length } }) # 4. 提取角色状态变化 for i, char_state in enumerate(analysis.get('character_states', [])): char_name = char_state.get('character_name', '未知角色') memories.append({ 'type': 'character_event', 'content': f"{char_name}的状态变化: {char_state.get('state_before', '')} → {char_state.get('state_after', '')}。{char_state.get('psychological_change', '')}", 'title': f"{char_name}的变化", 'metadata': { 'chapter_id': chapter_id, 'chapter_number': chapter_number, 'importance_score': 0.7, 'tags': ['角色', char_name, '状态变化'], 'related_characters': [char_name], 'is_foreshadow': 0 } }) # 5. 如果有重要冲突,也记录下来 conflict = analysis.get('conflict', {}) if conflict and conflict.get('level', 0) >= 7: # 确保 parties 和 types 都是字符串列表 parties = conflict.get('parties', []) if parties and isinstance(parties, list): parties = [str(p) for p in parties] types = conflict.get('types', []) if types and isinstance(types, list): types = [str(t) for t in types] memories.append({ 'type': 'plot_point', 'content': f"重要冲突: {conflict.get('description', '')}。冲突各方: {', '.join(parties)}", 'title': f"冲突 - 强度{conflict.get('level', 0)}", 'metadata': { 'chapter_id': chapter_id, 'chapter_number': chapter_number, 'importance_score': min(conflict.get('level', 5) / 10, 1.0), 'tags': ['冲突'] + types, 'is_foreshadow': 0 } }) logger.info(f"📝 从分析中提取了{len(memories)}条记忆") return memories except Exception as e: logger.error(f"❌ 提取记忆失败: {str(e)}") return [] def _find_text_position(self, full_text: str, keyword: str) -> tuple[int, int]: """ 在全文中查找关键词位置 Args: full_text: 完整文本 keyword: 关键词 Returns: (起始位置, 长度) 如果未找到返回(-1, 0) """ if not keyword or not full_text: return (-1, 0) try: # 1. 精确匹配 pos = full_text.find(keyword) if pos != -1: return (pos, len(keyword)) # 2. 去除标点符号后匹配 import re clean_keyword = re.sub(r'[,。!?、;:""''()《》【】]', '', keyword) clean_text = re.sub(r'[,。!?、;:""''()《》【】]', '', full_text) pos = clean_text.find(clean_keyword) if pos != -1: # 反向映射到原文位置(简化处理) return (pos, len(clean_keyword)) # 3. 模糊匹配:查找关键词的前半部分 if len(keyword) > 10: partial = keyword[:min(15, len(keyword))] pos = full_text.find(partial) if pos != -1: return (pos, len(partial)) # 4. 未找到 logger.debug(f"未找到关键词位置: {keyword[:30]}...") return (-1, 0) except Exception as e: logger.error(f"查找位置失败: {str(e)}") return (-1, 0) def generate_analysis_summary(self, analysis: Dict[str, Any]) -> str: """ 生成分析摘要文本 Args: analysis: 分析结果 Returns: 格式化的摘要文本 """ try: lines = ["=== 章节分析报告 ===\n"] # 整体评分 scores = analysis.get('scores', {}) lines.append(f"【整体评分】") lines.append(f" 整体质量: {scores.get('overall', 'N/A')}/10") lines.append(f" 节奏把控: {scores.get('pacing', 'N/A')}/10") lines.append(f" 吸引力: {scores.get('engagement', 'N/A')}/10") lines.append(f" 连贯性: {scores.get('coherence', 'N/A')}/10\n") # 剧情阶段 lines.append(f"【剧情阶段】{analysis.get('plot_stage', '未知')}\n") # 钩子统计 hooks = analysis.get('hooks', []) if hooks: lines.append(f"【钩子分析】共{len(hooks)}个") for hook in hooks[:3]: # 只显示前3个 lines.append(f" • [{hook.get('type')}] {hook.get('content', '')[:50]}... (强度:{hook.get('strength', 0)})") lines.append("") # 伏笔统计 foreshadows = analysis.get('foreshadows', []) if foreshadows: planted = sum(1 for f in foreshadows if f.get('type') == 'planted') resolved = sum(1 for f in foreshadows if f.get('type') == 'resolved') lines.append(f"【伏笔分析】埋下{planted}个, 回收{resolved}个\n") # 冲突分析 conflict = analysis.get('conflict', {}) if conflict: lines.append(f"【冲突分析】") lines.append(f" 类型: {', '.join(conflict.get('types', []))}") lines.append(f" 强度: {conflict.get('level', 0)}/10") lines.append(f" 进度: {int(conflict.get('resolution_progress', 0) * 100)}%\n") # 改进建议 suggestions = analysis.get('suggestions', []) if suggestions: lines.append(f"【改进建议】") for i, sug in enumerate(suggestions, 1): lines.append(f" {i}. {sug}") return "\n".join(lines) except Exception as e: logger.error(f"❌ 生成摘要失败: {str(e)}") return "分析摘要生成失败" # 创建全局实例(需要时手动初始化) _plot_analyzer_instance = None def get_plot_analyzer(ai_service: AIService) -> PlotAnalyzer: """获取剧情分析器实例""" global _plot_analyzer_instance if _plot_analyzer_instance is None: _plot_analyzer_instance = PlotAnalyzer(ai_service) return _plot_analyzer_instance