docs: add story-first markdown-first design

2026-03-19 16:01:09 +08:00
parent c6e07ce5ca
commit 13e3124b85
3 changed files with 678 additions and 162 deletions
--- a/api/app/agents/memoir/init.py
+++ b/api/app/agents/memoir/init.py
@@ -1,11 +1,7 @@
 """回忆录模块：MemoryAgent、BackgroundTaskRunner、MemoirOrchestrator、各 Specialist Agent"""

 from app.agents.memoir.memory_agent import MemoryAgent
-from app.agents.memoir.processor import (
-    BackgroundTaskRunner,
-    ContentAnalyzer,
-    MemoirGenerator,
-)
+from app.agents.memoir.processor import BackgroundTaskRunner
 from app.agents.memoir.orchestrator import MemoirOrchestrator
 from app.agents.memoir.extraction_agent import ExtractionAgent, ExtractionResult
 from app.agents.memoir.classification_agent import ClassificationAgent
@@ -15,8 +11,6 @@ from app.agents.memoir.placeholder_agent import inject_placeholders
 __all__ = [
    "MemoryAgent",
    "BackgroundTaskRunner",
-    "ContentAnalyzer",
-    "MemoirGenerator",
    "MemoirOrchestrator",
    "ExtractionAgent",
    "ExtractionResult",
--- a/api/app/agents/memoir/processor.py
+++ b/api/app/agents/memoir/processor.py
@@ -1,176 +1,23 @@
 """
-回忆录后台处理器：分析对话、更新状态、生成章节、创意标题
-使用 Celery 进行后台任务处理
+回忆录后台处理器：debounce 聚合后派发 Celery 任务
+实际回忆录生成由 memoir_tasks.process_memoir_segments 调用 MemoirOrchestrator 完成
 """

 from __future__ import annotations

-import json
-from dataclasses import dataclass
 from typing import Dict, List

-from app.core.dependencies import get_llm_provider
 from app.core.logging import get_logger
 from app.core.task_tracker import task_tracker

-from app.agents.state_schema import MemoirStateSchema
-from app.features.memoir.memoir_images.json_payload import extract_json_payload
-from app.agents.memoir.prompts import (
-    get_creative_title_prompt,
-    get_narrative_json_prompt,
-    get_state_extraction_prompt,
-)
-
 logger = get_logger(__name__)

-STAGE_KEYWORDS = {
-    "childhood": ["童年", "小时候", "出生", "家乡", "小镇"],
-    "education": ["上学", "学校", "老师", "同学", "教育", "大学"],
-    "career": ["工作", "职业", "事业", "公司", "同事", "创业"],
-    "family": ["伴侣", "孩子", "家庭", "家人", "结婚", "父母"],
-    "belief": ["信念", "价值观", "座右铭", "坚持", "原则"],
-}
-
-
-def _get_langchain_llm():
-    try:
-        provider = get_llm_provider()
-        return getattr(provider, "langchain_llm", None)
-    except Exception:
-        return None
-
-
-@dataclass
-class AnalysisResult:
-    detected_stage: str
-    extracted_slots: Dict[str, str]
-    emotion: str
-    is_new_chapter: bool
-
-
-class ContentAnalyzer:
-    def __init__(self) -> None:
-        self.llm = _get_langchain_llm()
-
-    def _detect_stage(self, user_message: str, fallback_stage: str) -> str:
-        message = user_message.lower()
-        for stage, keywords in STAGE_KEYWORDS.items():
-            if any(word in message for word in keywords):
-                return stage
-        return fallback_stage
-
-    def _fallback_slots(
-        self, state: MemoirStateSchema, stage: str, user_message: str
-    ) -> Dict[str, str]:
-        stage_slots = state.slots.get(stage, {})
-        for key, value in stage_slots.items():
-            if not value.snippet:
-                return {key: user_message.strip()[:200]}
-        return {}
-
-    async def analyze_message(
-        self, user_message: str, current_state: MemoirStateSchema
-    ) -> AnalysisResult:
-        detected_stage = self._detect_stage(user_message, current_state.current_stage)
-        extracted_slots: Dict[str, str] = {}
-        emotion = "neutral"
-        is_new_chapter = False
-        if self.llm:
-            try:
-                prompt = get_state_extraction_prompt(
-                    user_message=user_message,
-                    current_stage=current_state.current_stage,
-                    stage_slots=current_state.slots.get(detected_stage, {}),
-                )
-                json_llm = self.llm.bind(
-                    model_kwargs={"response_format": {"type": "json_object"}},
-                    max_tokens=1024,
-                )
-                response = await json_llm.ainvoke(prompt)
-                content = response.content.strip()
-                parsed = json.loads(extract_json_payload(content))
-                detected_stage = parsed.get("detected_stage", detected_stage)
-                extracted_slots = parsed.get("slots", {}) or {}
-                emotion = parsed.get("emotion", emotion)
-                is_new_chapter = bool(parsed.get("is_new_chapter", is_new_chapter))
-            except json.JSONDecodeError:
-                extracted_slots = self._fallback_slots(
-                    current_state, detected_stage, user_message
-                )
-            except Exception as e:
-                logger.error("分析消息失败: %s", e)
-                extracted_slots = self._fallback_slots(
-                    current_state, detected_stage, user_message
-                )
-        else:
-            extracted_slots = self._fallback_slots(
-                current_state, detected_stage, user_message
-            )
-        return AnalysisResult(
-            detected_stage=detected_stage,
-            extracted_slots=extracted_slots,
-            emotion=emotion,
-            is_new_chapter=is_new_chapter,
-        )
-
-
-class MemoirGenerator:
-    def __init__(self) -> None:
-        self.llm = _get_langchain_llm()
-
-    async def generate_chapter_title(
-        self, stage: str, slots: Dict[str, str], emotion: str
-    ) -> str:
-        if not self.llm:
-            return f"{stage} 回忆"
-        try:
-            prompt = get_creative_title_prompt(
-                stage=stage, emotion=emotion, slots=slots
-            )
-            response = await self.llm.ainvoke(prompt)
-            return response.content.strip().strip('"')
-        except Exception as e:
-            logger.error("生成标题失败: %s", e)
-            return f"{stage} 回忆"
-
-    async def generate_narrative(
-        self,
-        stage: str,
-        slots: Dict[str, str],
-        new_content: str,
-        existing_content: str,
-    ) -> str:
-        if not self.llm:
-            if existing_content:
-                return f"{existing_content}\n\n{new_content}"
-            return new_content
-        try:
-            prompt = get_narrative_json_prompt(
-                stage=stage,
-                slots=slots,
-                new_content=new_content,
-                existing_content=existing_content,
-            )
-            json_llm = self.llm.bind(
-                model_kwargs={"response_format": {"type": "json_object"}},
-                max_tokens=4096,
-            )
-            response = await json_llm.ainvoke(prompt)
-            return response.content.strip()
-        except Exception as e:
-            logger.error("生成叙事失败: %s", e)
-            if existing_content:
-                return f"{existing_content}\n\n{new_content}"
-            return new_content
-

 class BackgroundTaskRunner:
    def __init__(self, debounce_seconds: int = 5) -> None:
        self.debounce_seconds = debounce_seconds
        self._pending: Dict[str, List[str]] = {}
        self._timers: Dict[str, object] = {}
-        self.analyzer = ContentAnalyzer()
-        self.generator = MemoirGenerator()

    async def _submit_task(self, user_id: str, segment_ids: List[str]) -> str | None:
        try: