life-echo/api/app/agents/chat/orchestrator.py

"""
ChatOrchestrator：AI 回复用户模块的编排层
负责路由（Profile vs Interview）、调用 Specialist Agent；持久化由 feature 层 ConversationHistoryStore 完成。
"""

import time
from collections.abc import Callable
from datetime import datetime
from typing import TYPE_CHECKING, List, Optional

from sqlalchemy.ext.asyncio import AsyncSession

from app.agents.chat.agent_turn import AgentChatTurn
from app.agents.chat.helpers import get_history_with_window
from app.agents.chat.interview_agent import InterviewAgent
from app.agents.chat.interview_state_hints import (
    build_runtime_interview_state,
    extract_scene_cues,
)
from app.agents.chat.profile_agent import ProfileAgent
from app.agents.chat.stage_detection import (
    detect_primary_life_stage,
    life_stage_display_name,
)
from app.agents.state_schema import MemoirStateSchema
from app.core.agent_logging import agent_summary_enabled, log_agent_detail
from app.core.config import settings
from app.core.dependencies import get_embedding_provider
from app.core.llm_gateway import LlmGateway
from app.core.logging import get_logger
from app.features.conversation.input_normalize import normalize_chat_input_for_agent
from app.features.memoir.state_service import (
    get_or_create_state,
    save_interview_state_meta,
    switch_stage,
)
from app.features.memory.prompt_adapter import MemoryPromptAdapter
from app.features.conversation.constants import chat
from app.features.memory.constants import memory
from app.features.story.constants import story


def _llm_for_chat_input_normalize():
    try:
        return LlmGateway().langchain_llm_for()
    except Exception:
        return None


if TYPE_CHECKING:
    from app.features.user.models import User
    from app.ports.embedding import EmbeddingProvider
    from app.ports.llm import LLMProvider

logger = get_logger(__name__)

_UNAUTH_TURN_ZH = AgentChatTurn(
    messages=["暂时没法继续对话，请先登录后再试。"], skip_tts=True
)
_UNAUTH_TURN_EN = AgentChatTurn(
    messages=["You'll need to sign in again before we can continue."],
    skip_tts=True,
)


def _user_language(user: Optional["User"]) -> str:
    if not user:
        return "zh"
    lang = getattr(user, "language_preference", None) or "zh"
    return "en" if str(lang).lower() == "en" else "zh"


async def _fetch_interview_memory_bundle(
    db: AsyncSession,
    user_id: str,
    user_message: str,
    *,
    get_embedding_provider_fn: Callable[[], "EmbeddingProvider"],
) -> tuple[dict | None, object | None]:
    """检索记忆 bundle（原始结构）；是否进主 prompt 由 adapter 再筛。"""
    from app.features.memory.retrieval_trace import (
        chat_memory_retrieval_trace_from_bundle,
    )
    from app.features.memory.service import MemoryService

    if not chat.memory_retrieval_enabled:
        logger.debug(
            "event=chat_memory_retrieval_skip reason=disabled user_id={}", user_id
        )
        return None, None
    msg = (user_message or "").strip()
    if not msg:
        logger.debug(
            "event=chat_memory_retrieval_skip reason=empty user_id={}", user_id
        )
        return None, None
    try:
        emb = get_embedding_provider_fn()
        ms = MemoryService(db, embedding_provider=emb)
        top_k = chat.memory_top_k
        bundle = await ms.retrieve(user_id, msg, top_k=top_k)
        bd = bundle.model_dump()
        trace = chat_memory_retrieval_trace_from_bundle(
            bd, top_k=top_k, query_len=len(msg)
        )
        logger.info(
            "event=memory_retrieval_bundle user_id={} top_k={}",
            user_id,
            top_k,
        )
        return bd, trace
    except Exception as e:
        try:
            await db.rollback()
        except Exception as rollback_error:
            logger.warning("访谈记忆检索失败后回滚也失败: {}", rollback_error)
        logger.warning("访谈记忆检索失败: {}", e)
        return None, None


class ChatOrchestrator:
    """
    聊天编排器：根据用户资料完成度路由到 ProfileAgent 或 InterviewAgent。
    不直接写入 Redis/DB；由 WS pipeline / ConversationHistoryStore 落库并同步缓存。

    ``get_embedding_provider_fn`` / ``llm_provider`` 供测试或脚本注入；默认使用全局依赖。
    """

    def __init__(
        self,
        *,
        get_embedding_provider_fn: Callable[[], "EmbeddingProvider"] | None = None,
        llm_provider: "LLMProvider | None" = None,
    ):
        self._get_embedding_provider_fn = (
            get_embedding_provider_fn or get_embedding_provider
        )
        self.profile_agent = ProfileAgent(llm_provider=llm_provider)
        self.interview_agent = InterviewAgent()
        self.memory_prompt_adapter = MemoryPromptAdapter()

    async def process_user_message(
        self,
        conversation_id: str,
        user_message: str,
        user: Optional["User"],
        conversation,  # 用于更新 conversation_stage
        is_from_voice: bool,
        voice_session_id: Optional[str],
        db: AsyncSession,
        apply_extracted_profile_fn,
        get_missing_profile_fields_fn,
        get_filled_profile_fields_fn,
        user_message_timestamp: Optional[datetime] = None,
        audio_duration_seconds: Optional[int] = None,
    ) -> AgentChatTurn:
        """
        处理用户消息，返回 AI 回复（分段 + 是否跳过 TTS）。
        根据 missing_fields 路由到 ProfileAgent 或 InterviewAgent。
        """
        t0 = time.perf_counter()
        language = _user_language(user)

        # --- 资料收集模式 ---
        if user:
            missing = get_missing_profile_fields_fn(user)
            if missing:
                hw_profile = await get_history_with_window(
                    conversation_id,
                    max_pairs=chat.history_max_pairs,
                    max_chars=chat.history_max_chars,
                )
                profile_turn_total = hw_profile.turn_total
                if profile_turn_total >= chat.profile_max_turns:
                    logger.info(
                        "event=chat_profile_cap_skip conversation_id={} "
                        "turn_total={} cap={} missing_fields={}",
                        conversation_id,
                        profile_turn_total,
                        chat.profile_max_turns,
                        missing,
                    )
                else:
                    try:
                        log_agent_detail(
                            logger,
                            "ChatOrchestrator route=profile conversation_id={} "
                            "missing_fields={} user_msg_len={} profile_turn_total={}",
                            conversation_id,
                            missing,
                            len(user_message or ""),
                            profile_turn_total,
                        )
                        # Profile 阶段每轮都抽取：短确认语也可能带可推断资料，跳过抽取会导致槽位长期不更新
                        extracted = (
                            await self.profile_agent.extract_profile_from_message(
                                user_message,
                                missing,
                                conversation_id=conversation_id,
                                language=language,
                            )
                        )
                        logger.info(
                            "event=chat_profile_extract conversation_id={} "
                            "extracted_keys={} missing_before={}",
                            conversation_id,
                            list(extracted.keys()) if extracted else [],
                            missing,
                        )
                        if extracted:
                            await apply_extracted_profile_fn(user, extracted, db)

                        remaining = get_missing_profile_fields_fn(user)
                        filled = get_filled_profile_fields_fn(user)
                        interview_stage_hint = ""
                        if not remaining:
                            st = await get_or_create_state(user.id, db)
                            interview_stage_hint = life_stage_display_name(
                                st.current_stage, language=language
                            )
                        responses = await self.profile_agent.generate_profile_followup(
                            conversation_id=conversation_id,
                            user_message=user_message,
                            missing_fields=remaining,
                            filled_fields=filled,
                            nickname=user.nickname or "",
                            interview_stage_hint=interview_stage_hint,
                            language=language,
                        )
                        if agent_summary_enabled():
                            logger.info(
                                "ChatOrchestrator.process_user_message route=profile "
                                "duration_ms={:.2f} conversation_id={} response_segments={}",
                                (time.perf_counter() - t0) * 1000,
                                conversation_id,
                                len(responses),
                            )
                        return AgentChatTurn(
                            messages=responses,
                            skip_tts=False,
                            memory_retrieval_trace=None,
                        )
                    except Exception as e:
                        logger.exception("资料收集处理失败: {}", e)
                        fb_msg = (
                            "Sorry, I missed that. Could you say it again?"
                            if language == "en"
                            else "不好意思刚才没接住，你再说一遍好吗？"
                        )
                        return AgentChatTurn(
                            messages=[fb_msg],
                            skip_tts=False,
                            memory_retrieval_trace=None,
                        )

        # --- 正式访谈模式 ---
        user_id = user.id if user else None
        if not user_id:
            if agent_summary_enabled():
                logger.info(
                    "ChatOrchestrator.process_user_message route=unauth "
                    "duration_ms={:.2f} conversation_id={}",
                    (time.perf_counter() - t0) * 1000,
                    conversation_id,
                )
            return _UNAUTH_TURN_EN if language == "en" else _UNAUTH_TURN_ZH

        log_agent_detail(
            logger,
            "ChatOrchestrator route=interview conversation_id={} user_msg_len={}",
            conversation_id,
            len(user_message or ""),
        )
        llm_n = None
        if chat.input_normalize_enabled and (
            (chat.input_normalize_mode or "").strip().lower() == "llm"
        ):
            llm_n = _llm_for_chat_input_normalize()
        normalized_user_message = normalize_chat_input_for_agent(
            user_message or "",
            llm=llm_n,
            is_from_voice=is_from_voice,
        )
        state = await get_or_create_state(user_id, db)
        stage_before = state.current_stage
        detected = await detect_primary_life_stage(
            normalized_user_message,
            state.current_stage,
            self.interview_agent.llm,
        )
        stage_switched_this_turn = detected != stage_before
        if stage_switched_this_turn:
            state = await switch_stage(user_id, detected, db)

        if conversation and conversation.conversation_stage != state.current_stage:
            from app.core.db import transactional

            async with transactional(db):
                conversation.conversation_stage = state.current_stage

        from app.agents.chat.background_voice import infer_background_voice
        from app.agents.chat.prompts_profile import format_user_profile_context

        user_profile_context = ""
        background_voice = "default"
        occupation = ""
        if user:
            user_profile_context = format_user_profile_context(
                birth_year=user.birth_year,
                birth_place=user.birth_place,
                grew_up_place=user.grew_up_place,
                occupation=user.occupation,
                language=language,
            )
            background_voice = infer_background_voice(user.occupation)
            occupation = user.occupation or ""

        memory_bundle, mem_trace = await _fetch_interview_memory_bundle(
            db,
            user_id,
            normalized_user_message,
            get_embedding_provider_fn=self._get_embedding_provider_fn,
        )
        mem_slices = self.memory_prompt_adapter.slice_for_interview(
            memory_bundle,
            normalized_user_message,
        )
        # 场景关键词仅作为 focus planner 的辅助输入，不直接拼进记忆块，避免抢过用户明确的关系/身份线索
        scene_cues_for_planner = extract_scene_cues(normalized_user_message)

        profile_birth_year = user.birth_year if user else None
        profile_era_place = ""
        if user:
            profile_era_place = (user.birth_place or user.grew_up_place or "").strip()
        prompt_state = build_runtime_interview_state(
            state,
            user_message=normalized_user_message,
            active_stage=detected or state.current_stage,
            birth_year=profile_birth_year,
            birth_place=(user.birth_place or "").strip() if user else "",
            grew_up_place=(user.grew_up_place or "").strip() if user else "",
            occupation=occupation,
        )

        turn = await self.interview_agent.generate_response_with_state(
            conversation_id=conversation_id,
            user_message=user_message,
            memoir_state=prompt_state,
            user_profile_context=user_profile_context,
            detected_user_stage=detected,
            memory_evidence_text=mem_slices.prompt_excerpt,
            memory_anchor_source=mem_slices.anchor_source,
            memory_planner_text=mem_slices.planner_preview,
            background_voice=background_voice,
            normalized_user_message=normalized_user_message,
            occupation=occupation,
            profile_birth_year=profile_birth_year,
            profile_era_place=profile_era_place,
            stage_switched_this_turn=stage_switched_this_turn,
            scene_cues_for_planner=scene_cues_for_planner,
            language=language,
        )
        recent_questions = prompt_state.recent_questions
        if turn.interview_state_meta and isinstance(turn.interview_state_meta, dict):
            raw_recent = turn.interview_state_meta.get("recent_questions")
            if isinstance(raw_recent, list):
                recent_questions = [
                    str(x).strip() for x in raw_recent if str(x).strip()
                ]
        await save_interview_state_meta(
            user_id,
            known_facts=prompt_state.known_facts,
            persona_threads=prompt_state.persona_threads,
            recent_questions=recent_questions,
            db=db,
        )
        if agent_summary_enabled():
            logger.info(
                "ChatOrchestrator.process_user_message route=interview "
                "duration_ms={:.2f} conversation_id={} stage={} response_segments={} skip_tts={}",
                (time.perf_counter() - t0) * 1000,
                conversation_id,
                state.current_stage,
                len(turn.messages),
                turn.skip_tts,
            )
        if mem_trace is not None:
            return AgentChatTurn(
                messages=turn.messages,
                skip_tts=turn.skip_tts,
                memory_retrieval_trace=mem_trace,
                interview_state_meta=turn.interview_state_meta,
            )
        return turn

    async def extract_profile_from_message(
        self,
        user_message: str,
        missing_fields: List[str],
        conversation_id: Optional[str] = None,
    ):
        """委托 ProfileAgent 提取资料"""
        return await self.profile_agent.extract_profile_from_message(
            user_message, missing_fields, conversation_id=conversation_id
        )

    async def generate_profile_followup(
        self,
        conversation_id: str,
        user_message: str,
        missing_fields: List[str],
        filled_fields: dict,
        nickname: str = "",
        is_from_voice: bool = False,
        voice_session_id: str | None = None,
        user_message_timestamp: datetime | None = None,
        audio_duration_seconds: int | None = None,
        language: str = "zh",
    ) -> List[str]:
        """委托 ProfileAgent 生成资料追问（持久化由调用方负责）。"""
        return await self.profile_agent.generate_profile_followup(
            conversation_id=conversation_id,
            user_message=user_message,
            missing_fields=missing_fields,
            filled_fields=filled_fields,
            nickname=nickname,
            language=language,
        )

    async def generate_profile_greeting(
        self,
        conversation_id: str,
        missing_fields: List[str],
        nickname: str = "",
        language: str = "zh",
    ) -> List[str]:
        """委托 ProfileAgent 生成资料收集开场白（持久化由调用方负责）。"""
        return await self.profile_agent.generate_profile_greeting(
            conversation_id=conversation_id,
            missing_fields=missing_fields,
            nickname=nickname,
            language=language,
        )

    async def generate_response_with_state(
        self,
        conversation_id: str,
        user_message: str,
        memoir_state: MemoirStateSchema,
        user_profile_context: str = "",
        is_from_voice: bool = False,
        voice_session_id: str | None = None,
        user_message_timestamp: datetime | None = None,
        audio_duration_seconds: int | None = None,
        detected_user_stage: str | None = None,
        memory_evidence_text: str = "",
        memory_anchor_source: str = "",
        memory_planner_text: str = "",
        background_voice: str = "default",
        normalized_user_message: str | None = None,
        occupation: str = "",
        profile_birth_year: int | None = None,
        profile_era_place: str = "",
        stage_switched_this_turn: bool = False,
        scene_cues_for_planner: Optional[list[str]] = None,
        language: str = "zh",
    ) -> AgentChatTurn:
        """委托 InterviewAgent 生成访谈回复（持久化由调用方负责）。"""
        return await self.interview_agent.generate_response_with_state(
            conversation_id=conversation_id,
            user_message=user_message,
            memoir_state=memoir_state,
            user_profile_context=user_profile_context,
            detected_user_stage=detected_user_stage,
            memory_evidence_text=memory_evidence_text,
            memory_anchor_source=memory_anchor_source,
            memory_planner_text=memory_planner_text,
            background_voice=background_voice,
            normalized_user_message=normalized_user_message,
            occupation=occupation,
            profile_birth_year=profile_birth_year,
            profile_era_place=profile_era_place,
            stage_switched_this_turn=stage_switched_this_turn,
            scene_cues_for_planner=scene_cues_for_planner,
            language=language,
        )

    def detect_user_stage(self, user_message: str) -> str:
        """委托 InterviewAgent 检测用户阶段"""
        return self.interview_agent._detect_user_stage(user_message)

    async def generate_opening_message(
        self,
        conversation_id: str,
        memoir_state: MemoirStateSchema,
        user_profile_context: str = "",
        background_voice: str = "default",
        occupation: str = "",
        profile_birth_year: Optional[int] = None,
        profile_era_place: str = "",
        language: str = "zh",
    ) -> List[str]:
        """
        委托 InterviewAgent 生成访谈开场白（持久化由调用方 ConversationHistoryStore 负责）。
        """
        return await self.interview_agent.generate_opening_message(
            conversation_id=conversation_id,
            memoir_state=memoir_state,
            user_profile_context=user_profile_context,
            background_voice=background_voice,
            occupation=occupation,
            profile_birth_year=profile_birth_year,
            profile_era_place=profile_era_place,
            language=language,
        )

    async def generate_re_greeting_message(
        self,
        conversation_id: str,
        memoir_state: MemoirStateSchema,
        idle_hours: float,
        user_profile_context: str = "",
        background_voice: str = "default",
        occupation: str = "",
        profile_birth_year: Optional[int] = None,
        profile_era_place: str = "",
        language: str = "zh",
    ) -> List[str]:
        """委托 InterviewAgent 生成老对话回访问候（持久化由调用方负责）。"""
        return await self.interview_agent.generate_re_greeting_message(
            conversation_id=conversation_id,
            memoir_state=memoir_state,
            idle_hours=idle_hours,
            user_profile_context=user_profile_context,
            background_voice=background_voice,
            occupation=occupation,
            profile_birth_year=profile_birth_year,
            profile_era_place=profile_era_place,
            language=language,
        )