api/app/agents/chat/interview_agent.py

"""
InterviewAgent：正式访谈 Specialist
负责状态感知回复、开场白，不负责 Redis 持久化（由 Orchestrator 统一处理）
"""

import time
from typing import Any, List, Optional

from langchain_core.messages import HumanMessage, SystemMessage

from app.agents.chat.agent_turn import AgentChatTurn
from app.agents.chat.helpers import format_history_string, get_history_with_window
from app.agents.chat.interview_state_hints import (
    apply_autobiographical_boundary_guard,
    apply_duplicate_question_guard,
    extract_recent_questions,
    segments_are_only_duplicate_guard_fallback,
    update_recent_questions,
)
from app.agents.chat.interview_turn_plan import plan_interview_turn
from app.agents.chat.personas import normalize_interview_persona
from app.agents.chat.prompt_context import ChatPromptContext
from app.agents.chat.prompts_conversation import (
    SLOT_NAME_MAP,
    get_opening_prompt,
)
from app.agents.chat.reply_limits import (
    nonempty_segments_or_fallback,
    segments_from_llm_response,
    truncate_chat_segments,
)
from app.agents.chat.reply_planner import maybe_refine_turn_plan_with_llm
from app.agents.chat.stage_detection import keyword_fallback_primary_stage
from app.agents.state_schema import (
    MemoirStateSchema,
    interview_control_state,
    narrative_coverage_state,
)
from app.core.agent_logging import (
    agent_span,
    log_agent_payload,
    log_agent_summary,
)
from app.core.config import settings
from app.core.llm_gateway import LlmGateway, LlmUseCase
from app.core.logging import get_logger
from app.features.conversation.input_normalize import normalize_chat_input_for_agent

logger = get_logger(__name__)

# LLM 不可用或调用失败时对用户展示（不暴露异常细节、不触发 TTS）
_FALLBACK_REPLY = "刚才网络不太稳，没接上。你可以再说一遍，或稍后再试。"

# 仅在「重复问句守卫」把正文削成单句兜底时追加二次 system，只多调一次模型。
_DUPLICATE_GUARD_LLM_RETRY_SYSTEM_APPENDIX = """## 二次生成（纠偏）
上一版模型输出因包含与「最近已问过的问题」或「已确认事实」重复的问句，已被系统弃用。请**重新写一整条回复**：
- 仍须遵守上文全部主规则；
- 先贴着用户本轮原话承接半句到一两句（可有画面感）；
- **禁止**再用与刚才同义、仅换说法的确认型问句；
- 若要提问，须换**全新角度**，并锚在用户刚说的具体细节里；也可以本轮**完全不提问**，只并肩承接；
- **禁止**整段只有「这一段我记住了」或同类无信息套话。"""


def _finalize_chat_segments_after_llm(
    response_text: str,
    *,
    max_segments: int,
    max_chars: int,
    memoir_state: MemoirStateSchema,
    recent_questions: list[str],
) -> tuple[list[str], bool]:
    """Turn raw LLM text into the final list of chat segments.

    Pipeline: split into segments, truncate to the segment/char limits,
    guarantee a non-empty result (falling back to ``_FALLBACK_REPLY``), then
    run the duplicate-question guard.

    Args:
        response_text: Raw text returned by the model.
        max_segments: Upper bound on the number of segments.
        max_chars: Upper bound on characters per segment.
        memoir_state: State handed to the duplicate-question guard.
        recent_questions: Questions passed to the duplicate-question guard.

    Returns:
        ``(segments, deduped)`` exactly as produced by
        ``apply_duplicate_question_guard``.
    """
    # Each ``or`` fallback is evaluated only when the previous step produced
    # nothing, so ``response_text.strip()`` is touched lazily.
    pieces = segments_from_llm_response(
        response_text,
        max_segments=max_segments,
    ) or [response_text.strip()]
    trimmed = truncate_chat_segments(
        pieces,
        max_segments=max_segments,
        max_chars_per_segment=max_chars,
    ) or [response_text.strip()[:max_chars]]
    safe_segments = nonempty_segments_or_fallback(trimmed, fallback=_FALLBACK_REPLY)
    guarded, was_deduped = apply_duplicate_question_guard(
        safe_segments,
        state=memoir_state,
        recent_questions=recent_questions,
    )
    return guarded, was_deduped


def _get_langchain_llm() -> Optional[Any]:
    """Build the LangChain chat model used for interview replies.

    Returns:
        Whatever ``LlmGateway().langchain_llm_for`` yields for the
        ``"chat.interview"`` use case, or ``None`` when construction raises.
    """
    try:
        return LlmGateway().langchain_llm_for(LlmUseCase("chat.interview"))
    except Exception as exc:
        # Deliberately best-effort: the agent must remain constructible without
        # a working LLM. Log the cause instead of swallowing it silently so a
        # misconfiguration can be diagnosed.
        logger.warning(
            "event=interview_llm_unavailable error={}", exc, exc_info=True
        )
        return None


def _message_contents_char_count(messages: List[Any]) -> int:
    """Sum the lengths of all string ``content`` attributes in ``messages``.

    Items without a ``content`` attribute, or whose ``content`` is not a
    ``str``, contribute nothing to the total.
    """
    contents = (getattr(msg, "content", None) for msg in messages)
    return sum(len(text) for text in contents if isinstance(text, str))


class InterviewAgent:
    """正式访谈 Specialist Agent"""

    def __init__(self):
        """Attach the interview chat model to the agent as ``self.llm``."""
        interview_llm = _get_langchain_llm()
        self.llm = interview_llm

    def _detect_user_stage(self, user_message: str) -> str:
        """Keyword fallback for the user's stage.

        Delegates to ``keyword_fallback_primary_stage`` so the result stays
        consistent with the ``stage_detection`` module (multi-stage scoring).
        """
        primary_stage = keyword_fallback_primary_stage(user_message)
        return primary_stage

    def _resolve_text_for_model(
        self,
        user_message: str,
        normalized_user_message: Optional[str],
    ) -> str:
        """模型侧净稿：编排层已归一则直接用；否则在本层补一次（含可选 LLM）。"""
        if normalized_user_message is not None:
            return (normalized_user_message or "").strip()
        llm_n = None
        if settings.chat_input_normalize_enabled and (
            (settings.chat_input_normalize_mode or "").strip().lower() == "llm"
        ):
            llm_n = self.llm
        return normalize_chat_input_for_agent(user_message or "", llm=llm_n)

    async def generate_response_with_state(
        self,
        conversation_id: str,
        user_message: str,
        memoir_state: MemoirStateSchema,
        user_profile_context: str = "",
        detected_user_stage: Optional[str] = None,
        memory_evidence_text: str = "",
        memory_anchor_source: str = "",
        memory_planner_text: str = "",
        background_voice: str = "default",
        normalized_user_message: Optional[str] = None,
        occupation: str = "",
        profile_birth_year: int | None = None,
        profile_era_place: str = "",
        stage_switched_this_turn: bool = False,
        scene_cues_for_planner: Optional[list[str]] = None,
    ) -> AgentChatTurn:
        """Generate a state-aware interview reply; nothing is persisted here
        (persistence is the Orchestrator's job).

        Args:
            conversation_id: Used to load the history window and for logging.
            user_message: Raw user text; only used when
                ``normalized_user_message`` is ``None``.
            memoir_state: Source of the current stage, slot coverage, known
                facts, persona threads and stored recent questions.
            user_profile_context: Forwarded to the prompt context.
            detected_user_stage: Stage detected upstream; when ``None`` the
                keyword fallback runs on the model-side text.
            memory_evidence_text: Forwarded to the prompt context; also the
                planner's memory text when ``memory_planner_text`` is empty.
            memory_anchor_source: Passed (stripped) to ``plan_interview_turn``
                as its ``memory_evidence_text`` argument.
            memory_planner_text: Preferred memory text for the LLM planner.
            background_voice: Forwarded to the prompt context.
            normalized_user_message: Pre-normalized user text, if available.
            occupation: Forwarded to the prompt context.
            profile_birth_year: Forwarded to the prompt context.
            profile_era_place: Forwarded to the prompt context.
            stage_switched_this_turn: Forwarded to ``plan_interview_turn``.
            scene_cues_for_planner: Forwarded to the LLM planner (``[]`` when
                ``None``).

        Returns:
            An ``AgentChatTurn`` with the reply segments and
            ``interview_state_meta``. When no LLM is available, or any
            exception is raised, a single ``_FALLBACK_REPLY`` segment with
            ``skip_tts=True`` is returned instead.
        """
        if not self.llm:
            logger.warning("InterviewAgent: LLM 未配置，返回兜底文案")
            return AgentChatTurn(messages=[_FALLBACK_REPLY], skip_tts=True)
        try:
            text_for_model = self._resolve_text_for_model(
                user_message, normalized_user_message
            )
            narrative_state = narrative_coverage_state(memoir_state)
            control_state = interview_control_state(memoir_state)
            # Slot coverage for the current stage feeds both the turn plan and
            # the system prompt.
            empty_slots = control_state.prompt_empty_slots_for_stage(
                narrative_state, memoir_state.current_stage
            )
            filled_slots = narrative_state.filled_slots_for_stage(
                memoir_state.current_stage
            )
            # Prefer the stage detected upstream; otherwise fall back to
            # keyword detection on the model-side text.
            if detected_user_stage is not None:
                du = detected_user_stage
            else:
                du = self._detect_user_stage(text_for_model)
            hw = await get_history_with_window(
                conversation_id,
                max_pairs=settings.chat_history_max_pairs,
                max_chars=settings.chat_history_max_chars,
            )
            recent_questions = extract_recent_questions(hw.window)
            conversation_turn_total = hw.turn_total
            all_stages_coverage = narrative_state.all_stages_coverage()
            persona = normalize_interview_persona(settings.chat_interview_persona)
            max_segments = int(settings.chat_interview_max_segments)
            max_tokens = int(settings.chat_interview_max_tokens)
            max_chars = int(settings.chat_interview_max_chars_per_segment)

            # Baseline turn plan. Note that the ``memory_evidence_text``
            # argument is fed from ``memory_anchor_source`` here, not from the
            # ``memory_evidence_text`` parameter of this method.
            turn_plan = plan_interview_turn(
                current_stage=memoir_state.current_stage,
                empty_slots=empty_slots,
                normalized_user_message=text_for_model,
                memory_evidence_text=(memory_anchor_source or "").strip(),
                stage_switched_this_turn=stage_switched_this_turn,
            )
            logger.info(
                "event=interview_turn_plan mode={} anchor_slot={} snippet_len={}",
                turn_plan.mode,
                turn_plan.anchor_slot_key or "-",
                len(turn_plan.anchor_snippet or ""),
            )

            reply_planner_raw = ""
            # Capture the baseline before the optional LLM refinement so both
            # can be reported in the returned meta.
            baseline_mode = turn_plan.mode
            baseline_primary_focus = turn_plan.primary_focus
            if settings.chat_reply_planner_llm_enabled:
                # Only the last four recent questions are shown to the planner.
                rq_preview = (
                    "\n".join(recent_questions[-4:])
                    if recent_questions
                    else ""
                )
                turn_plan, reply_planner_raw = await maybe_refine_turn_plan_with_llm(
                    self.llm,
                    plan=turn_plan,
                    text_for_model=text_for_model,
                    memory_evidence_text=(memory_planner_text or memory_evidence_text)
                    or "",
                    max_tokens=int(settings.chat_reply_planner_max_tokens),
                    temperature=float(settings.chat_reply_planner_temperature),
                    scene_cues_for_planner=scene_cues_for_planner or [],
                    recent_questions_preview=rq_preview,
                )
                if reply_planner_raw:
                    logger.info(
                        "event=reply_planner_applied memory_usage={} reply_shape={} "
                        "mode={} primary_focus={} focus_source={}",
                        turn_plan.memory_usage,
                        turn_plan.reply_shape,
                        turn_plan.mode,
                        turn_plan.primary_focus,
                        turn_plan.focus_source,
                    )

            # When the history window yields no questions, fall back to the
            # ones stored on the memoir state.
            ctx = ChatPromptContext(
                current_stage=memoir_state.current_stage,
                empty_slots=empty_slots,
                filled_slots=filled_slots,
                all_stages_coverage=all_stages_coverage,
                detected_user_stage=du,
                user_profile_context=user_profile_context,
                persona=persona,
                memory_evidence_text=memory_evidence_text,
                background_voice=background_voice,
                occupation=occupation,
                profile_birth_year=profile_birth_year,
                profile_era_place=profile_era_place,
                known_facts=memoir_state.known_facts,
                persona_threads=memoir_state.persona_threads,
                recent_questions=recent_questions or memoir_state.recent_questions,
                turn_plan=turn_plan,
            )
            system_prompt = ctx.guided_system_prompt()
            # Prompt layout: system prompt, windowed history, current user text.
            messages: List[Any] = [SystemMessage(content=system_prompt)]
            messages.extend(hw.window)
            messages.append(HumanMessage(content=text_for_model))
            # Presumably the window holds human/assistant pairs, hence // 2
            # (TODO confirm against get_history_with_window).
            history_pairs_windowed = len(hw.window) // 2
            window_chars = sum(len(getattr(m, "content", "") or "") for m in hw.window)
            logger.info(
                "event=history_window_applied total={} windowed={} chars={}",
                conversation_turn_total,
                history_pairs_windowed,
                window_chars,
            )
            log_agent_payload(
                logger,
                "InterviewAgent.generate_response.prompt",
                format_history_string(
                    messages,
                    omit_system_body=settings.agent_log_omit_system_message_body,
                ),
            )
            # The same bound model is reused for the duplicate-guard retry below.
            chat_llm = self.llm.bind(
                max_tokens=max_tokens,
                temperature=float(settings.chat_interview_temperature),
            )
            prompt_chars = _message_contents_char_count(messages)
            llm_t0 = time.perf_counter()
            with agent_span(
                logger,
                "InterviewAgent.generate_response.llm",
                conversation_id=conversation_id,
                stage=memoir_state.current_stage,
            ):
                logger.info(
                    "event=chat_prompt_built agent=InterviewAgent.generate_response_with_state "
                    "prompt_chars={} history_pairs_total={} history_pairs_windowed={}",
                    prompt_chars,
                    conversation_turn_total,
                    history_pairs_windowed,
                )
                response = await chat_llm.ainvoke(messages)
            response_ms = (time.perf_counter() - llm_t0) * 1000
            logger.info(
                "event=chat_llm_done agent=InterviewAgent.generate_response_with_state "
                "response_latency_ms={:.2f}",
                response_ms,
            )
            # Use ``.content`` when the response has one; otherwise stringify it.
            response_text = (
                response.content if hasattr(response, "content") else str(response)
            )
            log_agent_payload(
                logger, "InterviewAgent.generate_response.raw_response", response_text
            )
            rq_base = recent_questions or memoir_state.recent_questions
            out, deduped = _finalize_chat_segments_after_llm(
                response_text,
                max_segments=max_segments,
                max_chars=max_chars,
                memoir_state=memoir_state,
                recent_questions=rq_base,
            )
            retry_used = False
            # Retry exactly once, with a corrective appendix on the system
            # prompt, when the duplicate-question guard left only its fallback.
            if deduped and segments_are_only_duplicate_guard_fallback(out):
                retry_system = (
                    f"{system_prompt}\n\n{_DUPLICATE_GUARD_LLM_RETRY_SYSTEM_APPENDIX}"
                )
                retry_messages: List[Any] = [
                    SystemMessage(content=retry_system),
                    *hw.window,
                    HumanMessage(content=text_for_model),
                ]
                log_agent_payload(
                    logger,
                    "InterviewAgent.generate_response.retry_prompt",
                    format_history_string(
                        retry_messages,
                        omit_system_body=settings.agent_log_omit_system_message_body,
                    ),
                )
                llm_t1 = time.perf_counter()
                with agent_span(
                    logger,
                    "InterviewAgent.generate_response.llm_retry",
                    conversation_id=conversation_id,
                    stage=memoir_state.current_stage,
                ):
                    logger.info(
                        "event=chat_prompt_built agent=InterviewAgent.duplicate_guard_retry "
                        "prompt_chars={} conversation_id={}",
                        _message_contents_char_count(retry_messages),
                        conversation_id,
                    )
                    response_retry = await chat_llm.ainvoke(retry_messages)
                logger.info(
                    "event=chat_llm_done agent=InterviewAgent.duplicate_guard_retry "
                    "response_latency_ms={:.2f}",
                    (time.perf_counter() - llm_t1) * 1000,
                )
                response_text_retry = (
                    response_retry.content
                    if hasattr(response_retry, "content")
                    else str(response_retry)
                )
                log_agent_payload(
                    logger,
                    "InterviewAgent.generate_response.raw_response_retry",
                    response_text_retry,
                )
                # NOTE(review): ``deduped`` is overwritten with the retry's
                # result, so the meta flag below reflects the second pass only,
                # not whether the guard fired on the first pass — confirm this
                # is the intended meaning.
                out, deduped = _finalize_chat_segments_after_llm(
                    response_text_retry,
                    max_segments=max_segments,
                    max_chars=max_chars,
                    memoir_state=memoir_state,
                    recent_questions=rq_base,
                )
                retry_used = True
            out, auto_bio = apply_autobiographical_boundary_guard(out)
            updated_recent_questions = update_recent_questions(rq_base, out)
            log_agent_summary(
                logger,
                "InterviewAgent.generate_response segments={} conversation_id={} "
                "max_tokens={}",
                len(out),
                conversation_id,
                max_tokens,
            )
            # NOTE(review): ``skip_tts`` is always False on this path, even if
            # ``out`` ended up as the canned ``_FALLBACK_REPLY`` inserted by the
            # non-empty fallback — verify that reading the fallback aloud is
            # acceptable.
            return AgentChatTurn(
                messages=out,
                skip_tts=False,
                interview_state_meta={
                    "recent_questions": updated_recent_questions,
                    "duplicate_question_guard_triggered": deduped,
                    "duplicate_question_guard_llm_retry": retry_used,
                    "autobiographical_boundary_guard_triggered": auto_bio,
                    "reply_planner_llm_used": bool(
                        settings.chat_reply_planner_llm_enabled
                        and (reply_planner_raw or "").strip()
                    ),
                    "reply_planner_raw_preview": (reply_planner_raw or "")[:800],
                    "focus_planner_baseline_mode": baseline_mode,
                    "focus_planner_baseline_primary_focus": baseline_primary_focus,
                    "focus_planner_mode": turn_plan.mode,
                    "focus_planner_primary_focus": turn_plan.primary_focus,
                    "focus_planner_focus_source": turn_plan.focus_source,
                    "focus_planner_focus_summary": (turn_plan.focus_summary or "")[:200],
                },
            )
        except Exception as e:
            # Top-level boundary: never surface exception details to the user;
            # log and return the canned reply with TTS disabled.
            logger.error("生成回应失败: {}", e, exc_info=True)
            return AgentChatTurn(messages=[_FALLBACK_REPLY], skip_tts=True)

    async def generate_opening_message(
        self,
        conversation_id: str,
        memoir_state: MemoirStateSchema,
        user_profile_context: str = "",
        background_voice: str = "default",
        occupation: str = "",
        profile_birth_year: Optional[int] = None,
        profile_era_place: str = "",
    ) -> List[str]:
        """生成空对话开场白，不持久化（由 Orchestrator 负责）"""
        if not self.llm:
            return ["你好呀～ 又见面了。今天想从人生里哪一小段回忆开始聊聊？"]
        try:
            narrative_state = narrative_coverage_state(memoir_state)
            control_state = interview_control_state(memoir_state)
            empty_slots = control_state.prompt_empty_slots_for_stage(
                narrative_state, memoir_state.current_stage
            )
            empty_slots_readable = [SLOT_NAME_MAP.get(s, s) for s in empty_slots]
            persona = normalize_interview_persona(settings.chat_interview_persona)
            prompt = get_opening_prompt(
                current_stage=memoir_state.current_stage,
                empty_slots_readable=empty_slots_readable,
                user_profile_context=user_profile_context,
                persona=persona,
                background_voice=background_voice,
                occupation=occupation,
                profile_birth_year=profile_birth_year,
                profile_era_place=profile_era_place,
            )
            hw = await get_history_with_window(
                conversation_id,
                max_pairs=settings.chat_history_max_pairs,
                max_chars=settings.chat_history_max_chars,
            )
            messages: List[Any] = [SystemMessage(content=prompt)]
            messages.extend(hw.window)
            if not hw.window:
                messages.append(
                    HumanMessage(content="（对话刚开始，请自然地说出你的开场白。）")
                )
            else:
                messages.append(
                    HumanMessage(content="（请根据上文，自然接续并说出你的开场白。）")
                )
            log_agent_payload(
                logger,
                "InterviewAgent.opening.prompt",
                format_history_string(
                    messages,
                    omit_system_body=settings.agent_log_omit_system_message_body,
                ),
            )
            opening_llm = self.llm.bind(
                max_tokens=settings.chat_opening_max_tokens,
                temperature=float(settings.chat_interview_temperature),
            )
            prompt_chars = _message_contents_char_count(messages)
            llm_t0 = time.perf_counter()
            with agent_span(
                logger,
                "InterviewAgent.opening.llm",
                conversation_id=conversation_id,
            ):
                logger.info(
                    "event=chat_prompt_built agent=InterviewAgent.generate_opening_message "
                    "prompt_chars={} history_pairs_total={} history_pairs_windowed={}",
                    prompt_chars,
                    hw.turn_total,
                    len(hw.window) // 2,
                )
                response = await opening_llm.ainvoke(messages)
            logger.info(
                "event=chat_llm_done agent=InterviewAgent.generate_opening_message "
                "response_latency_ms={:.2f}",
                (time.perf_counter() - llm_t0) * 1000,
            )
            response_text = (
                response.content if hasattr(response, "content") else str(response)
            )
            log_agent_payload(
                logger, "InterviewAgent.opening.raw_response", response_text
            )
            raw_list = segments_from_llm_response(response_text, max_segments=2)
            if not raw_list:
                raw_list = [response_text.strip()]
            max_chars = int(settings.chat_interview_max_chars_per_segment)
            out = truncate_chat_segments(
                raw_list,
                max_segments=2,
                max_chars_per_segment=max_chars,
            )
            log_agent_summary(
                logger,
                "InterviewAgent.opening segments={} conversation_id={}",
                len(out),
                conversation_id,
            )
            segments = out if out else [response_text.strip()[:max_chars]]
            return nonempty_segments_or_fallback(
                segments,
                fallback="你好呀～ 又见面了。今天想从人生里哪一小段回忆开始聊聊？",
            )
        except Exception as e:
            logger.error("生成开场白失败: {}", e, exc_info=True)
            return ["你好呀～ 又见面了。今天想从人生里哪一小段回忆开始聊聊？"]
-												feat & refactor: 重构agents目录结构；AI回复模块agent结构封装

											
										
										
											2026-03-19 10:36:55 +08:00
+								"""
 								InterviewAgent：正式访谈 Specialist
 								负责状态感知回复、开场白，不负责 Redis 持久化（由 Orchestrator 统一处理）
 								"""
-												chore/ 删除无用文件

											
										
										
											2026-03-19 14:36:14 +08:00
-												refactor(agents): 抽取阶段常量与对话上下文；快档 LLM；图片 prompt 可禁止回退

访谈与阶段
- 新增 app/agents/stage_constants.py：集中 CHAT_STAGES、章节分类/顺序、阶段到默认 memoir 类别等，与 MemoirState 默认槽位顺序对齐；减少散落在 prompts 内的重复常量。
- 新增 app/agents/chat/prompt_context.py：以 ChatPromptContext 汇总 guided 系统提示所需字段（阶段、槽位、轮次、人设、记忆证据、回复长度模式、背景声线、职业等），统一走 get_guided_conversation_prompt。
- 大幅收敛 app/agents/chat/prompts_conversation.py；调整 prompts.py、stage_prompts.py、stage_detection.py；同步 interview_agent、profile_agent、helpers 与 state_schema，使对话侧构造提示的方式一致、可测。

回忆录流水线
- memoir/prompts.py 删除已迁至 stage_constants / 独立模板的大段常量与图片占位相关逻辑；classification / extraction / fidelity / narrative agents 与 orchest（全量历史仍可用于计数，注入模型时按轮次与字符上限截断）、image_prompt_fallback_disabled。
- dependencies 增加 get_llm_provider_fast（LRU 缓存，可与默认共用密钥与 base_url）。

任务与编排
- memoir_tasks：prepare_batches 注入 llm_fast；开启独立快档模型时打结构化日志。
- chapter_cover_tasks、story_image_tasks：与图片 prompt / JSON 工具路径或策略变更对齐（import 与行为一致）。
- story_pipeline_sync 等小处同步。

其它核心
- langchain_llm、text_normalize 随上述调用链微调。

开发者体验
- .cursor/settings.json：启用 redis-development、postman 插件。

测试
- 新增 test_image_prompt_policy：覆盖「禁止回退」等图片 prompt 策略。
- 更新 test_interview_prompts、test_interview_reply_length、test_experience_regressions、test_json_and_memory_utils，匹配新常量位置、json_utils 与对话/长度行为。

											
										
										
											2026-04-02 12:00:00 +08:00
+								import time
-												feat(api+app): 对话阶段化、回忆录流水线与客户端会话体验
- DB: segments 用户输入文本（Alembic 0002）
- Chat: 阶段检测/阶段提示/回复限制，编排与访谈/画像 prompts 调整
- Memoir: 忠实度检查 agent，叙事与分类等链路更新
- Core: agent 日志、Alembic 启动、LangChain/日志/配置等
- Story: time_hints；Memory 检索与相关测试
- Expo: 助手头像、会话页与消息拆分、实时会话与文案/i18n
- Docs/scripts/tests: 迁移脚本、LLM JSON/记忆检索文档、新增单测

											
										
										
											2026-03-26 12:13:36 +08:00
+								from typing import Any, List, Optional
-												feat & refactor: 重构agents目录结构；AI回复模块agent结构封装

											
										
										
											2026-03-19 10:36:55 +08:00
-												refactor(agents): 抽取阶段常量与对话上下文；快档 LLM；图片 prompt 可禁止回退

访谈与阶段
- 新增 app/agents/stage_constants.py：集中 CHAT_STAGES、章节分类/顺序、阶段到默认 memoir 类别等，与 MemoirState 默认槽位顺序对齐；减少散落在 prompts 内的重复常量。
- 新增 app/agents/chat/prompt_context.py：以 ChatPromptContext 汇总 guided 系统提示所需字段（阶段、槽位、轮次、人设、记忆证据、回复长度模式、背景声线、职业等），统一走 get_guided_conversation_prompt。
- 大幅收敛 app/agents/chat/prompts_conversation.py；调整 prompts.py、stage_prompts.py、stage_detection.py；同步 interview_agent、profile_agent、helpers 与 state_schema，使对话侧构造提示的方式一致、可测。

回忆录流水线
- memoir/prompts.py 删除已迁至 stage_constants / 独立模板的大段常量与图片占位相关逻辑；classification / extraction / fidelity / narrative agents 与 orchest（全量历史仍可用于计数，注入模型时按轮次与字符上限截断）、image_prompt_fallback_disabled。
- dependencies 增加 get_llm_provider_fast（LRU 缓存，可与默认共用密钥与 base_url）。

任务与编排
- memoir_tasks：prepare_batches 注入 llm_fast；开启独立快档模型时打结构化日志。
- chapter_cover_tasks、story_image_tasks：与图片 prompt / JSON 工具路径或策略变更对齐（import 与行为一致）。
- story_pipeline_sync 等小处同步。

其它核心
- langchain_llm、text_normalize 随上述调用链微调。

开发者体验
- .cursor/settings.json：启用 redis-development、postman 插件。

测试
- 新增 test_image_prompt_policy：覆盖「禁止回退」等图片 prompt 策略。
- 更新 test_interview_prompts、test_interview_reply_length、test_experience_regressions、test_json_and_memory_utils，匹配新常量位置、json_utils 与对话/长度行为。

											
										
										
											2026-04-02 12:00:00 +08:00
+								from langchain_core.messages import HumanMessage, SystemMessage
-												feat & refactor: 重构agents目录结构；AI回复模块agent结构封装

											
										
										
											2026-03-19 10:36:55 +08:00
-												refactor(agents): 抽取阶段常量与对话上下文；快档 LLM；图片 prompt 可禁止回退

访谈与阶段
- 新增 app/agents/stage_constants.py：集中 CHAT_STAGES、章节分类/顺序、阶段到默认 memoir 类别等，与 MemoirState 默认槽位顺序对齐；减少散落在 prompts 内的重复常量。
- 新增 app/agents/chat/prompt_context.py：以 ChatPromptContext 汇总 guided 系统提示所需字段（阶段、槽位、轮次、人设、记忆证据、回复长度模式、背景声线、职业等），统一走 get_guided_conversation_prompt。
- 大幅收敛 app/agents/chat/prompts_conversation.py；调整 prompts.py、stage_prompts.py、stage_detection.py；同步 interview_agent、profile_agent、helpers 与 state_schema，使对话侧构造提示的方式一致、可测。

回忆录流水线
- memoir/prompts.py 删除已迁至 stage_constants / 独立模板的大段常量与图片占位相关逻辑；classification / extraction / fidelity / narrative agents 与 orchest（全量历史仍可用于计数，注入模型时按轮次与字符上限截断）、image_prompt_fallback_disabled。
- dependencies 增加 get_llm_provider_fast（LRU 缓存，可与默认共用密钥与 base_url）。

任务与编排
- memoir_tasks：prepare_batches 注入 llm_fast；开启独立快档模型时打结构化日志。
- chapter_cover_tasks、story_image_tasks：与图片 prompt / JSON 工具路径或策略变更对齐（import 与行为一致）。
- story_pipeline_sync 等小处同步。

其它核心
- langchain_llm、text_normalize 随上述调用链微调。

开发者体验
- .cursor/settings.json：启用 redis-development、postman 插件。

测试
- 新增 test_image_prompt_policy：覆盖「禁止回退」等图片 prompt 策略。
- 更新 test_interview_prompts、test_interview_reply_length、test_experience_regressions、test_json_and_memory_utils，匹配新常量位置、json_utils 与对话/长度行为。

											
										
										
											2026-04-02 12:00:00 +08:00
+								from app.agents.chat.agent_turn import AgentChatTurn
 								from app.agents.chat.helpers import format_history_string, get_history_with_window
-												refactor(eval+memoir)：精简内部评测路由与服务，composite/对话摘要与 judge 能力补强

- 访谈：新增 interview_state_hints，联动 orchestrator 与提示词
- 回忆录：story_pipeline_sync/state/memory/post_commit 与 Celery 任务调整
- 基建：开发用 celery broker、compose/development 脚本、依赖注入
- eval-web：移除数据集/实验/版本等页面与流式轮询，突出 Playground
- 文档与单测同步

											
										
										
											2026-04-08 21:36:12 +08:00
+								from app.agents.chat.interview_state_hints import (
-												WIP: memory system improvements (in progress)

Interview/chat prompt layers, reply planner, style profiles, memory
injection, interview meta store, and related tests. Work not finished.

Made-with: Cursor

											
										
										
											2026-04-22 16:56:28 +08:00
+								    apply_autobiographical_boundary_guard,
-												refactor(eval+memoir)：精简内部评测路由与服务，composite/对话摘要与 judge 能力补强

- 访谈：新增 interview_state_hints，联动 orchestrator 与提示词
- 回忆录：story_pipeline_sync/state/memory/post_commit 与 Celery 任务调整
- 基建：开发用 celery broker、compose/development 脚本、依赖注入
- eval-web：移除数据集/实验/版本等页面与流式轮询，突出 Playground
- 文档与单测同步

											
										
										
											2026-04-08 21:36:12 +08:00
+								    apply_duplicate_question_guard,
 								    extract_recent_questions,
-												fix(chat): 重复追问被拦截时再多问一次模型

防重复问句会把整段回复削成「这一段我记住了。」只剩一句套话时，用带纠偏说明的 system 再调一次 LLM，尽量避免用户只看到干巴巴_ack。仍只重试一次，并打日志与 meta 标记 duplicate_question_guard_llm_retry。

											
										
										
											2026-04-10 15:33:28 +08:00
+								    segments_are_only_duplicate_guard_fallback,
-												refactor(eval+memoir)：精简内部评测路由与服务，composite/对话摘要与 judge 能力补强

- 访谈：新增 interview_state_hints，联动 orchestrator 与提示词
- 回忆录：story_pipeline_sync/state/memory/post_commit 与 Celery 任务调整
- 基建：开发用 celery broker、compose/development 脚本、依赖注入
- eval-web：移除数据集/实验/版本等页面与流式轮询，突出 Playground
- 文档与单测同步

											
										
										
											2026-04-08 21:36:12 +08:00
+								    update_recent_questions,
 								)
-												feat(chat): server-side interview turn plan (mode, anchor slot, snippet)

- Add plan_interview_turn: emotion_first / memoir_push / follow_user_only
- Inject hard directive block at top of guided system prompt
- Pass stage_switched_this_turn from ChatOrchestrator after stage detection
- Log interview_turn_plan for observability; add unit tests

											
										
										
											2026-04-10 13:56:44 +08:00
+								from app.agents.chat.interview_turn_plan import plan_interview_turn
-												feat(api): 访谈人格/回复长度策略、口述归一、背景语气与输入净稿全链路

Chat 访谈
- 新增 persona 系统（default / warm_listener / curious_guide）与 background_voice 语气层
- 回复长度由 compute_reply_plan 统一决策（brief / standard / expanded），融合信息密度启发式
- 输入净稿（input_normalize）：编排层可选 rules/llm 归一用户口语后再喂模型与记忆检索
- 记忆证据注入：按用户话检索 memory evidence 并注入 prompt

Memoir 回忆录
- 口述归一（oral_normalize）：segment 原文保留，story 管线取派生净稿作叙事输入
- segment 入队批次门闸：累计字数 + 最长等待秒数，减少零碎提交
- fidelity_check / prompts / narrative_agent 微调
- Alembic 0005：清理跨章节 story 外键

Infra
- Dockerfile 加入 ffmpeg
- pyproject.toml 新增依赖并同步 uv.lock
- .env.example / .env.production 补全新配置项

Tests
- 新增 test_background_voice、test_chat_input_normalize、test_experience_regressions
- 扩展 test_interview_prompts、test_interview_reply_length、test_story_route_oral_invariant

Made-with: Cursor

											
										
										
											2026-03-31 23:55:26 +08:00
+								from app.agents.chat.personas import normalize_interview_persona
-												refactor(agents): 抽取阶段常量与对话上下文；快档 LLM；图片 prompt 可禁止回退

访谈与阶段
- 新增 app/agents/stage_constants.py：集中 CHAT_STAGES、章节分类/顺序、阶段到默认 memoir 类别等，与 MemoirState 默认槽位顺序对齐；减少散落在 prompts 内的重复常量。
- 新增 app/agents/chat/prompt_context.py：以 ChatPromptContext 汇总 guided 系统提示所需字段（阶段、槽位、轮次、人设、记忆证据、回复长度模式、背景声线、职业等），统一走 get_guided_conversation_prompt。
- 大幅收敛 app/agents/chat/prompts_conversation.py；调整 prompts.py、stage_prompts.py、stage_detection.py；同步 interview_agent、profile_agent、helpers 与 state_schema，使对话侧构造提示的方式一致、可测。

回忆录流水线
- memoir/prompts.py 删除已迁至 stage_constants / 独立模板的大段常量与图片占位相关逻辑；classification / extraction / fidelity / narrative agents 与 orchest（全量历史仍可用于计数，注入模型时按轮次与字符上限截断）、image_prompt_fallback_disabled。
- dependencies 增加 get_llm_provider_fast（LRU 缓存，可与默认共用密钥与 base_url）。

任务与编排
- memoir_tasks：prepare_batches 注入 llm_fast；开启独立快档模型时打结构化日志。
- chapter_cover_tasks、story_image_tasks：与图片 prompt / JSON 工具路径或策略变更对齐（import 与行为一致）。
- story_pipeline_sync 等小处同步。

其它核心
- langchain_llm、text_normalize 随上述调用链微调。

开发者体验
- .cursor/settings.json：启用 redis-development、postman 插件。

测试
- 新增 test_image_prompt_policy：覆盖「禁止回退」等图片 prompt 策略。
- 更新 test_interview_prompts、test_interview_reply_length、test_experience_regressions、test_json_and_memory_utils，匹配新常量位置、json_utils 与对话/长度行为。

											
										
										
											2026-04-02 12:00:00 +08:00
+								from app.agents.chat.prompt_context import ChatPromptContext
-												refactor: 进一步重构agents目录结构 符合多agent架构

											
										
										
											2026-03-19 10:54:48 +08:00
+								from app.agents.chat.prompts_conversation import (
 								    SLOT_NAME_MAP,
 								    get_opening_prompt,
 								)
-												feat(memory,conversation): 记忆富化/证据包、时间线幂等字段与对话分段全链路

数据库
- 新增迁移 0003：timeline_events.memory_source_id 外键 → memory_sources，便于按 ingest 源做时间线幂等

后端 - 记忆
- 新增 ingest 后 LLM 富化（摘要/事实/时间线），可配置开关与最大字符数
- 新增证据包组装：合并 chunk、摘要、事实、时间线、故事等检索结果；支持空 query 时是否仍带 rolling 等开关
- repo/retriever/service/router/schemas/summarizer/timeline/extractor 等扩展；文档 memory-retrieval.md 更新

后端 - 对话 WS
- 增加 PING/PONG；分段 ASR 日志与空音频处理；转写失败与「无助手回复」错误提示更明确
- 助手多段回复持久化使用统一分隔符，与分段逻辑一致

后端 - Agent
- reply_limits：按 [SPLIT] 与段落拆段，并保证非空 fallback，供 WS 与 TTS 多段下发

后端 - 回忆录任务
- transcript ingest 记录 source_id；任务成功结……（原文在此截断）

											
										
										
											2026-03-27 16:01:28 +08:00
+								from app.agents.chat.reply_limits import (
 								    nonempty_segments_or_fallback,
 								    segments_from_llm_response,
 								    truncate_chat_segments,
 								)
-												feat(api): 收敛对话与记忆流程边界，引入 LLM 网关与专用服务

- MemoryService 异步路径委托 MemoryIngestService / MemoryRetrievalService；富化派发经 MemoryEnrichmentScheduler
- WebSocket pipeline 经 ChatTurnService 与显式 DTO 编排单轮对话；回忆录片段入队由 MemoirIngestScheduler 封装
- 新增 LlmGateway（LlmUseCase），各 agent、任务与适配器对齐 ports
- 补充 memory 提示适配、runtime 类型、memory-retrieval 文档、ai-touchpoints 说明与扫描脚本及配套测试

Made-with: Cursor

											
										
										
											2026-04-30 09:17:01 +08:00
+								from app.agents.chat.reply_planner import maybe_refine_turn_plan_with_llm
-												feat: 回忆录证据血缘与内部评测可追溯，顺带对齐本地评测台与 CI

数据库与模型：新增多版迁移（章节证据快照、对话血缘、记忆事实/时间线 lineage 等），把「成稿 ↔ 对话/记忆」的溯源信息落到表结构里。
业务链路：会话与 WS、回忆录/故事流水线、记忆写入与 enrichment 等跟着接上线索与快照；新增章节证据快照与评测侧 EvalTraceService 等模块，方便组评审用的证据包。
内部评测：自动化 run 与手工 memoir 评审共用可追溯证据；rubric/ judge 相关脚本与文档有配套调整。
app-eval-web：Memoir/实验详情里能展开看证据摘要与 evidence_trace（含对话轮次 id）；Vite 代理与 development.sh 注入的 API 端口与当前默认内部评测端口一致，避免改端口后页面连错服务。
工程杂项：GitHub Actions / 仓库说明有更新；各适配器与支付/配额/plan 等多处为小改动或跟随主改动的收尾；新增/扩充了?

											
										
										
											2026-04-08 15:37:09 +08:00
+								from app.agents.chat.stage_detection import keyword_fallback_primary_stage
-												feat(api)!: memory single chain — async MemoryService, strict eval closure

Route all memory ingest/retrieve/enrichment/compaction through async MemoryService.
Remove legacy sync memory implementations (ingest/retrieve/compaction); Celery and
memoir Phase2 call asyncio.run into MemoryService-backed helpers.

Memoir Phase1 batch ingest uses MemoryService.ingest_transcripts_batch; drop chapters.
evidence_bundle_json mirror (Alembic 0015). Evaluation uses snapshot/link-only bundles;
raise EvidenceClosureMissing instead of partial/fallback lineage tiers.

Split memoir state into NarrativeCoverageState and InterviewControlState; delete the
_interview_meta_store adapter layer. Remove rolling-query and recent-fact fallback
settings from config and evidence assembly.

Update judges, docs, tests, and PlaygroundPage alignment.

Made-with: Cursor

											
										
										
											2026-04-30 14:11:46 +08:00
+								from app.agents.state_schema import (
 								    MemoirStateSchema,
 								    interview_control_state,
 								    narrative_coverage_state,
 								)
-												feat(api+app): 对话阶段化、回忆录流水线与客户端会话体验
- DB: segments 用户输入文本（Alembic 0002）
- Chat: 阶段检测/阶段提示/回复限制，编排与访谈/画像 prompts 调整
- Memoir: 忠实度检查 agent，叙事与分类等链路更新
- Core: agent 日志、Alembic 启动、LangChain/日志/配置等
- Story: time_hints；Memory 检索与相关测试
- Expo: 助手头像、会话页与消息拆分、实时会话与文案/i18n
- Docs/scripts/tests: 迁移脚本、LLM JSON/记忆检索文档、新增单测

											
										
										
											2026-03-26 12:13:36 +08:00
+								from app.core.agent_logging import (
 								    agent_span,
 								    log_agent_payload,
 								    log_agent_summary,
 								)
 								from app.core.config import settings
-												feat(api): 收敛对话与记忆流程边界，引入 LLM 网关与专用服务

- MemoryService 异步路径委托 MemoryIngestService / MemoryRetrievalService；富化派发经 MemoryEnrichmentScheduler
- WebSocket pipeline 经 ChatTurnService 与显式 DTO 编排单轮对话；回忆录片段入队由 MemoirIngestScheduler 封装
- 新增 LlmGateway（LlmUseCase），各 agent、任务与适配器对齐 ports
- 补充 memory 提示适配、runtime 类型、memory-retrieval 文档、ai-touchpoints 说明与扫描脚本及配套测试

Made-with: Cursor

											
										
										
											2026-04-30 09:17:01 +08:00
+								from app.core.llm_gateway import LlmGateway, LlmUseCase
-												refactor(agents): 抽取阶段常量与对话上下文；快档 LLM；图片 prompt 可禁止回退

访谈与阶段
- 新增 app/agents/stage_constants.py：集中 CHAT_STAGES、章节分类/顺序、阶段到默认 memoir 类别等，与 MemoirState 默认槽位顺序对齐；减少散落在 prompts 内的重复常量。
- 新增 app/agents/chat/prompt_context.py：以 ChatPromptContext 汇总 guided 系统提示所需字段（阶段、槽位、轮次、人设、记忆证据、回复长度模式、背景声线、职业等），统一走 get_guided_conversation_prompt。
- 大幅收敛 app/agents/chat/prompts_conversation.py；调整 prompts.py、stage_prompts.py、stage_detection.py；同步 interview_agent、profile_agent、helpers 与 state_schema，使对话侧构造提示的方式一致、可测。

回忆录流水线
- memoir/prompts.py 删除已迁至 stage_constants / 独立模板的大段常量与图片占位相关逻辑；classification / extraction / fidelity / narrative agents 与 orchest（全量历史仍可用于计数，注入模型时按轮次与字符上限截断）、image_prompt_fallback_disabled。
- dependencies 增加 get_llm_provider_fast（LRU 缓存，可与默认共用密钥与 base_url）。

任务与编排
- memoir_tasks：prepare_batches 注入 llm_fast；开启独立快档模型时打结构化日志。
- chapter_cover_tasks、story_image_tasks：与图片 prompt / JSON 工具路径或策略变更对齐（import 与行为一致）。
- story_pipeline_sync 等小处同步。

其它核心
- langchain_llm、text_normalize 随上述调用链微调。

开发者体验
- .cursor/settings.json：启用 redis-development、postman 插件。

测试
- 新增 test_image_prompt_policy：覆盖「禁止回退」等图片 prompt 策略。
- 更新 test_interview_prompts、test_interview_reply_length、test_experience_regressions、test_json_and_memory_utils，匹配新常量位置、json_utils 与对话/长度行为。

											
										
										
											2026-04-02 12:00:00 +08:00
+								from app.core.logging import get_logger
-												feat(api): 访谈人格/回复长度策略、口述归一、背景语气与输入净稿全链路

Chat 访谈
- 新增 persona 系统（default / warm_listener / curious_guide）与 background_voice 语气层
- 回复长度由 compute_reply_plan 统一决策（brief / standard / expanded），融合信息密度启发式
- 输入净稿（input_normalize）：编排层可选 rules/llm 归一用户口语后再喂模型与记忆检索
- 记忆证据注入：按用户话检索 memory evidence 并注入 prompt

Memoir 回忆录
- 口述归一（oral_normalize）：segment 原文保留，story 管线取派生净稿作叙事输入
- segment 入队批次门闸：累计字数 + 最长等待秒数，减少零碎提交
- fidelity_check / prompts / narrative_agent 微调
- Alembic 0005：清理跨章节 story 外键

Infra
- Dockerfile 加入 ffmpeg
- pyproject.toml 新增依赖并同步 uv.lock
- .env.example / .env.production 补全新配置项

Tests
- 新增 test_background_voice、test_chat_input_normalize、test_experience_regressions
- 扩展 test_interview_prompts、test_interview_reply_length、test_story_route_oral_invariant

Made-with: Cursor

											
										
										
											2026-03-31 23:55:26 +08:00
+								from app.features.conversation.input_normalize import normalize_chat_input_for_agent
-												feat & refactor: 重构agents目录结构；AI回复模块agent结构封装

											
										
										
											2026-03-19 10:36:55 +08:00
 								logger = get_logger(__name__)
-												修复一些已知问题

											
										
										
											2026-03-20 17:25:42 +08:00
+								# LLM 不可用或调用失败时对用户展示（不暴露异常细节、不触发 TTS）
 								_FALLBACK_REPLY = "刚才网络不太稳，没接上。你可以再说一遍，或稍后再试。"
-												fix(chat): 重复追问被拦截时再多问一次模型

防重复问句会把整段回复削成「这一段我记住了。」只剩一句套话时，用带纠偏说明的 system 再调一次 LLM，尽量避免用户只看到干巴巴_ack。仍只重试一次，并打日志与 meta 标记 duplicate_question_guard_llm_retry。

											
										
										
											2026-04-10 15:33:28 +08:00
+								# 仅在「重复问句守卫」把正文削成单句兜底时追加二次 system，只多调一次模型。
 								_DUPLICATE_GUARD_LLM_RETRY_SYSTEM_APPENDIX = """## 二次生成（纠偏）
 								上一版模型输出因包含与「最近已问过的问题」或「已确认事实」重复的问句，已被系统弃用。请**重新写一整条回复**：
 								- 仍须遵守上文全部主规则；
 								- 先贴着用户本轮原话承接半句到一两句（可有画面感）；
 								- **禁止**再用与刚才同义、仅换说法的确认型问句；
 								- 若要提问，须换**全新角度**，并锚在用户刚说的具体细节里；也可以本轮**完全不提问**，只并肩承接；
 								- **禁止**整段只有「这一段我记住了」或同类无信息套话。"""
 								def _finalize_chat_segments_after_llm(
 								    response_text: str,
 								    *,
 								    max_segments: int,
 								    max_chars: int,
 								    memoir_state: MemoirStateSchema,
 								    recent_questions: list[str],
 								) -> tuple[list[str], bool]:
 								    """Turn raw LLM text into the final chat segments for one turn.

 								    The text is segmented, truncated, backfilled with the fallback reply
 								    if nothing usable remains, and finally passed through the
 								    duplicate-question guard.

 								    Returns:
 								        A ``(segments, deduped)`` pair exactly as produced by
 								        ``apply_duplicate_question_guard``.
 								    """
 								    # Ask the segmenter first; if it yields nothing, treat the whole
 								    # stripped response as a single segment.
 								    segments = segments_from_llm_response(
 								        response_text,
 								        max_segments=max_segments,
 								    ) or [response_text.strip()]
 								    # Enforce the per-segment and segment-count limits; if truncation
 								    # leaves nothing, keep a hard-cut prefix of the stripped response.
 								    limited = truncate_chat_segments(
 								        segments,
 								        max_segments=max_segments,
 								        max_chars_per_segment=max_chars,
 								    ) or [response_text.strip()[:max_chars]]
 								    safe_segments = nonempty_segments_or_fallback(
 								        limited, fallback=_FALLBACK_REPLY
 								    )
 								    guarded, deduped = apply_duplicate_question_guard(
 								        safe_segments,
 								        state=memoir_state,
 								        recent_questions=recent_questions,
 								    )
 								    return guarded, deduped
-												feat & refactor: 重构agents目录结构；AI回复模块agent结构封装

											
										
										
											2026-03-19 10:36:55 +08:00
 								def _get_langchain_llm():
 								    try:
-												feat(api): 收敛对话与记忆流程边界，引入 LLM 网关与专用服务

- MemoryService 异步路径委托 MemoryIngestService / MemoryRetrievalService；富化派发经 MemoryEnrichmentScheduler
- WebSocket pipeline 经 ChatTurnService 与显式 DTO 编排单轮对话；回忆录片段入队由 MemoirIngestScheduler 封装
- 新增 LlmGateway（LlmUseCase），各 agent、任务与适配器对齐 ports
- 补充 memory 提示适配、runtime 类型、memory-retrieval 文档、ai-touchpoints 说明与扫描脚本及配套测试

Made-with: Cursor

											
										
										
											2026-04-30 09:17:01 +08:00
+								        return LlmGateway().langchain_llm_for(LlmUseCase("chat.interview"))
-												feat & refactor: 重构agents目录结构；AI回复模块agent结构封装

											
										
										
											2026-03-19 10:36:55 +08:00
+								    except Exception:
 								        return None
-												refactor(agents): 抽取阶段常量与对话上下文；快档 LLM；图片 prompt 可禁止回退

访谈与阶段
- 新增 app/agents/stage_constants.py：集中 CHAT_STAGES、章节分类/顺序、阶段到默认 memoir 类别等，与 MemoirState 默认槽位顺序对齐；减少散落在 prompts 内的重复常量。
- 新增 app/agents/chat/prompt_context.py：以 ChatPromptContext 汇总 guided 系统提示所需字段（阶段、槽位、轮次、人设、记忆证据、回复长度模式、背景声线、职业等），统一走 get_guided_conversation_prompt。
- 大幅收敛 app/agents/chat/prompts_conversation.py；调整 prompts.py、stage_prompts.py、stage_detection.py；同步 interview_agent、profile_agent、helpers 与 state_schema，使对话侧构造提示的方式一致、可测。

回忆录流水线
- memoir/prompts.py 删除已迁至 stage_constants / 独立模板的大段常量与图片占位相关逻辑；classification / extraction / fidelity / narrative agents 与 orchest（全量历史仍可用于计数，注入模型时按轮次与字符上限截断）、image_prompt_fallback_disabled。
- dependencies 增加 get_llm_provider_fast（LRU 缓存，可与默认共用密钥与 base_url）。

任务与编排
- memoir_tasks：prepare_batches 注入 llm_fast；开启独立快档模型时打结构化日志。
- chapter_cover_tasks、story_image_tasks：与图片 prompt / JSON 工具路径或策略变更对齐（import 与行为一致）。
- story_pipeline_sync 等小处同步。

其它核心
- langchain_llm、text_normalize 随上述调用链微调。

开发者体验
- .cursor/settings.json：启用 redis-development、postman 插件。

测试
- 新增 test_image_prompt_policy：覆盖「禁止回退」等图片 prompt 策略。
- 更新 test_interview_prompts、test_interview_reply_length、test_experience_regressions、test_json_and_memory_utils，匹配新常量位置、json_utils 与对话/长度行为。

											
										
										
											2026-04-02 12:00:00 +08:00
+								def _message_contents_char_count(messages: List[Any]) -> int:
 								    n = 0
 								    for m in messages:
 								        c = getattr(m, "content", None)
 								        if isinstance(c, str):
 								            n += len(c)
 								    return n
-												feat & refactor: 重构agents目录结构；AI回复模块agent结构封装

											
										
										
											2026-03-19 10:36:55 +08:00
+								class InterviewAgent:
 								    """正式访谈 Specialist Agent"""
 								    def __init__(self) -> None:
 								        """Create the agent and fetch its LLM handle from ``_get_langchain_llm``."""
 								        # May be None: _get_langchain_llm returns None when the gateway
 								        # lookup raises, and callers check ``self.llm`` before use.
 								        self.llm = _get_langchain_llm()
 								    def _detect_user_stage(self, user_message: str) -> str:
-												feat(api+app): 对话阶段化、回忆录流水线与客户端会话体验
- DB: segments 用户输入文本（Alembic 0002）
- Chat: 阶段检测/阶段提示/回复限制，编排与访谈/画像 prompts 调整
- Memoir: 忠实度检查 agent，叙事与分类等链路更新
- Core: agent 日志、Alembic 启动、LangChain/日志/配置等
- Story: time_hints；Memory 检索与相关测试
- Expo: 助手头像、会话页与消息拆分、实时会话与文案/i18n
- Docs/scripts/tests: 迁移脚本、LLM JSON/记忆检索文档、新增单测

											
										
										
											2026-03-26 12:13:36 +08:00
+								        """关键词回退：与 stage_detection 一致（多阶段打分）。"""
 								        return keyword_fallback_primary_stage(user_message)
-												feat & refactor: 重构agents目录结构；AI回复模块agent结构封装

											
										
										
											2026-03-19 10:36:55 +08:00
-												feat(api): 访谈人格/回复长度策略、口述归一、背景语气与输入净稿全链路

Chat 访谈
- 新增 persona 系统（default / warm_listener / curious_guide）与 background_voice 语气层
- 回复长度由 compute_reply_plan 统一决策（brief / standard / expanded），融合信息密度启发式
- 输入净稿（input_normalize）：编排层可选 rules/llm 归一用户口语后再喂模型与记忆检索
- 记忆证据注入：按用户话检索 memory evidence 并注入 prompt

Memoir 回忆录
- 口述归一（oral_normalize）：segment 原文保留，story 管线取派生净稿作叙事输入
- segment 入队批次门闸：累计字数 + 最长等待秒数，减少零碎提交
- fidelity_check / prompts / narrative_agent 微调
- Alembic 0005：清理跨章节 story 外键

Infra
- Dockerfile 加入 ffmpeg
- pyproject.toml 新增依赖并同步 uv.lock
- .env.example / .env.production 补全新配置项

Tests
- 新增 test_background_voice、test_chat_input_normalize、test_experience_regressions
- 扩展 test_interview_prompts、test_interview_reply_length、test_story_route_oral_invariant

Made-with: Cursor

											
										
										
											2026-03-31 23:55:26 +08:00
+								    def _resolve_text_for_model(
 								        self,
 								        user_message: str,
 								        normalized_user_message: Optional[str],
 								    ) -> str:
 								        """模型侧净稿：编排层已归一则直接用；否则在本层补一次（含可选 LLM）。"""
 								        if normalized_user_message is not None:
 								            return (normalized_user_message or "").strip()
 								        llm_n = None
 								        if settings.chat_input_normalize_enabled and (
 								            (settings.chat_input_normalize_mode or "").strip().lower() == "llm"
 								        ):
 								            llm_n = self.llm
 								        return normalize_chat_input_for_agent(user_message or "", llm=llm_n)
-												feat & refactor: 重构agents目录结构；AI回复模块agent结构封装

											
										
										
											2026-03-19 10:36:55 +08:00
 								    async def generate_response_with_state(
 								        self,
 								        conversation_id: str,
 								        user_message: str,
 								        memoir_state: MemoirStateSchema,
 								        user_profile_context: str = "",
-												feat(api+app): 对话阶段化、回忆录流水线与客户端会话体验
- DB: segments 用户输入文本（Alembic 0002）
- Chat: 阶段检测/阶段提示/回复限制，编排与访谈/画像 prompts 调整
- Memoir: 忠实度检查 agent，叙事与分类等链路更新
- Core: agent 日志、Alembic 启动、LangChain/日志/配置等
- Story: time_hints；Memory 检索与相关测试
- Expo: 助手头像、会话页与消息拆分、实时会话与文案/i18n
- Docs/scripts/tests: 迁移脚本、LLM JSON/记忆检索文档、新增单测

											
										
										
											2026-03-26 12:13:36 +08:00
+								        detected_user_stage: Optional[str] = None,
-												feat(api): 访谈人格/回复长度策略、口述归一、背景语气与输入净稿全链路

Chat 访谈
- 新增 persona 系统（default / warm_listener / curious_guide）与 background_voice 语气层
- 回复长度由 compute_reply_plan 统一决策（brief / standard / expanded），融合信息密度启发式
- 输入净稿（input_normalize）：编排层可选 rules/llm 归一用户口语后再喂模型与记忆检索
- 记忆证据注入：按用户话检索 memory evidence 并注入 prompt

Memoir 回忆录
- 口述归一（oral_normalize）：segment 原文保留，story 管线取派生净稿作叙事输入
- segment 入队批次门闸：累计字数 + 最长等待秒数，减少零碎提交
- fidelity_check / prompts / narrative_agent 微调
- Alembic 0005：清理跨章节 story 外键

Infra
- Dockerfile 加入 ffmpeg
- pyproject.toml 新增依赖并同步 uv.lock
- .env.example / .env.production 补全新配置项

Tests
- 新增 test_background_voice、test_chat_input_normalize、test_experience_regressions
- 扩展 test_interview_prompts、test_interview_reply_length、test_story_route_oral_invariant

Made-with: Cursor

											
										
										
											2026-03-31 23:55:26 +08:00
+								        memory_evidence_text: str = "",
-												WIP: memory system improvements (in progress)

Interview/chat prompt layers, reply planner, style profiles, memory
injection, interview meta store, and related tests. Work not finished.

Made-with: Cursor

											
										
										
											2026-04-22 16:56:28 +08:00
+								        memory_anchor_source: str = "",
 								        memory_planner_text: str = "",
-												feat(api): 访谈人格/回复长度策略、口述归一、背景语气与输入净稿全链路

Chat 访谈
- 新增 persona 系统（default / warm_listener / curious_guide）与 background_voice 语气层
- 回复长度由 compute_reply_plan 统一决策（brief / standard / expanded），融合信息密度启发式
- 输入净稿（input_normalize）：编排层可选 rules/llm 归一用户口语后再喂模型与记忆检索
- 记忆证据注入：按用户话检索 memory evidence 并注入 prompt

Memoir 回忆录
- 口述归一（oral_normalize）：segment 原文保留，story 管线取派生净稿作叙事输入
- segment 入队批次门闸：累计字数 + 最长等待秒数，减少零碎提交
- fidelity_check / prompts / narrative_agent 微调
- Alembic 0005：清理跨章节 story 外键

Infra
- Dockerfile 加入 ffmpeg
- pyproject.toml 新增依赖并同步 uv.lock
- .env.example / .env.production 补全新配置项

Tests
- 新增 test_background_voice、test_chat_input_normalize、test_experience_regressions
- 扩展 test_interview_prompts、test_interview_reply_length、test_story_route_oral_invariant

Made-with: Cursor

											
										
										
											2026-03-31 23:55:26 +08:00
+								        background_voice: str = "default",
 								        normalized_user_message: Optional[str] = None,
-												feat(api): 叙事 prompt、职业上下文、读路径章节、WS 解耦与错误脱敏

- 回忆录：事实边界补充允许清单；传记文体示例与 JSON 叙事要求对齐
- default 职业提示 occupation_context；cadre/military 退休语境
- GET 章节读路径零写入，prepare_chapter_read_view + markdown_for_response
- 文本归一抽到 core/text_normalize；移除弃用 reply 策略与 recompose_chapters_for_story
- ConversationService：WS 连接/用户段落/结束对话；对外错误固定文案
- 测试：HTTP 脱敏契约、章节读视图、occupation 与 background_voice

											
										
										
											2026-04-01 11:49:33 +08:00
+								        occupation: str = "",
-												feat: 回忆录证据血缘与内部评测可追溯，顺带对齐本地评测台与 CI

数据库与模型：新增多版迁移（章节证据快照、对话血缘、记忆事实/时间线 lineage 等），把「成稿 ↔ 对话/记忆」的溯源信息落到表结构里。
业务链路：会话与 WS、回忆录/故事流水线、记忆写入与 enrichment 等跟着接上线索与快照；新增章节证据快照与评测侧 EvalTraceService 等模块，方便组评审用的证据包。
内部评测：自动化 run 与手工 memoir 评审共用可追溯证据；rubric/ judge 相关脚本与文档有配套调整。
app-eval-web：Memoir/实验详情里能展开看证据摘要与 evidence_trace（含对话轮次 id）；Vite 代理与 development.sh 注入的 API 端口与当前默认内部评测端口一致，避免改端口后页面连错服务。
工程杂项：GitHub Actions / 仓库说明有更新；各适配器与支付/配额/plan 等多处为小改动或跟随主改动的收尾；新增/扩充了?

											
										
										
											2026-04-08 15:37:09 +08:00
+								        profile_birth_year: int | None = None,
 								        profile_era_place: str = "",
-												feat(chat): server-side interview turn plan (mode, anchor slot, snippet)

- Add plan_interview_turn: emotion_first / memoir_push / follow_user_only
- Inject hard directive block at top of guided system prompt
- Pass stage_switched_this_turn from ChatOrchestrator after stage detection
- Log interview_turn_plan for observability; add unit tests

											
										
										
											2026-04-10 13:56:44 +08:00
+								        stage_switched_this_turn: bool = False,
-												WIP: memory system improvements (in progress)

Interview/chat prompt layers, reply planner, style profiles, memory
injection, interview meta store, and related tests. Work not finished.

Made-with: Cursor

											
										
										
											2026-04-22 16:56:28 +08:00
+								        scene_cues_for_planner: Optional[list[str]] = None,
-												修复一些已知问题

											
										
										
											2026-03-20 17:25:42 +08:00
+								    ) -> AgentChatTurn:
-												feat & refactor: 重构agents目录结构；AI回复模块agent结构封装

											
										
										
											2026-03-19 10:36:55 +08:00
+								        """生成状态感知的访谈回复，不持久化（由 Orchestrator 负责）"""
 								        if not self.llm:
-												修复一些已知问题

											
										
										
											2026-03-20 17:25:42 +08:00
+								            logger.warning("InterviewAgent: LLM 未配置，返回兜底文案")
 								            return AgentChatTurn(messages=[_FALLBACK_REPLY], skip_tts=True)
-												feat & refactor: 重构agents目录结构；AI回复模块agent结构封装

											
										
										
											2026-03-19 10:36:55 +08:00
+								        try:
-												feat(api): 访谈人格/回复长度策略、口述归一、背景语气与输入净稿全链路

Chat 访谈
- 新增 persona 系统（default / warm_listener / curious_guide）与 background_voice 语气层
- 回复长度由 compute_reply_plan 统一决策（brief / standard / expanded），融合信息密度启发式
- 输入净稿（input_normalize）：编排层可选 rules/llm 归一用户口语后再喂模型与记忆检索
- 记忆证据注入：按用户话检索 memory evidence 并注入 prompt

Memoir 回忆录
- 口述归一（oral_normalize）：segment 原文保留，story 管线取派生净稿作叙事输入
- segment 入队批次门闸：累计字数 + 最长等待秒数，减少零碎提交
- fidelity_check / prompts / narrative_agent 微调
- Alembic 0005：清理跨章节 story 外键

Infra
- Dockerfile 加入 ffmpeg
- pyproject.toml 新增依赖并同步 uv.lock
- .env.example / .env.production 补全新配置项

Tests
- 新增 test_background_voice、test_chat_input_normalize、test_experience_regressions
- 扩展 test_interview_prompts、test_interview_reply_length、test_story_route_oral_invariant

Made-with: Cursor

											
										
										
											2026-03-31 23:55:26 +08:00
+								            text_for_model = self._resolve_text_for_model(
 								                user_message, normalized_user_message
 								            )
-												feat(api)!: memory single chain — async MemoryService, strict eval closure

Route all memory ingest/retrieve/enrichment/compaction through async MemoryService.
Remove legacy sync memory implementations (ingest/retrieve/compaction); Celery and
memoir Phase2 call asyncio.run into MemoryService-backed helpers.

Memoir Phase1 batch ingest uses MemoryService.ingest_transcripts_batch; drop chapters.
evidence_bundle_json mirror (Alembic 0015). Evaluation uses snapshot/link-only bundles;
raise EvidenceClosureMissing instead of partial/fallback lineage tiers.

Split memoir state into NarrativeCoverageState and InterviewControlState; delete the
_interview_meta_store adapter layer. Remove rolling-query and recent-fact fallback
settings from config and evidence assembly.

Update judges, docs, tests, and PlaygroundPage alignment.

Made-with: Cursor

											
										
										
											2026-04-30 14:11:46 +08:00
+								            narrative_state = narrative_coverage_state(memoir_state)
 								            control_state = interview_control_state(memoir_state)
 								            empty_slots = control_state.prompt_empty_slots_for_stage(
 								                narrative_state, memoir_state.current_stage
 								            )
 								            filled_slots = narrative_state.filled_slots_for_stage(
 								                memoir_state.current_stage
 								            )
-												feat(api+app): 对话阶段化、回忆录流水线与客户端会话体验
- DB: segments 用户输入文本（Alembic 0002）
- Chat: 阶段检测/阶段提示/回复限制，编排与访谈/画像 prompts 调整
- Memoir: 忠实度检查 agent，叙事与分类等链路更新
- Core: agent 日志、Alembic 启动、LangChain/日志/配置等
- Story: time_hints；Memory 检索与相关测试
- Expo: 助手头像、会话页与消息拆分、实时会话与文案/i18n
- Docs/scripts/tests: 迁移脚本、LLM JSON/记忆检索文档、新增单测

											
										
										
											2026-03-26 12:13:36 +08:00
+								            if detected_user_stage is not None:
 								                du = detected_user_stage
 								            else:
-												feat(api): 访谈人格/回复长度策略、口述归一、背景语气与输入净稿全链路

Chat 访谈
- 新增 persona 系统（default / warm_listener / curious_guide）与 background_voice 语气层
- 回复长度由 compute_reply_plan 统一决策（brief / standard / expanded），融合信息密度启发式
- 输入净稿（input_normalize）：编排层可选 rules/llm 归一用户口语后再喂模型与记忆检索
- 记忆证据注入：按用户话检索 memory evidence 并注入 prompt

Memoir 回忆录
- 口述归一（oral_normalize）：segment 原文保留，story 管线取派生净稿作叙事输入
- segment 入队批次门闸：累计字数 + 最长等待秒数，减少零碎提交
- fidelity_check / prompts / narrative_agent 微调
- Alembic 0005：清理跨章节 story 外键

Infra
- Dockerfile 加入 ffmpeg
- pyproject.toml 新增依赖并同步 uv.lock
- .env.example / .env.production 补全新配置项

Tests
- 新增 test_background_voice、test_chat_input_normalize、test_experience_regressions
- 扩展 test_interview_prompts、test_interview_reply_length、test_story_route_oral_invariant

Made-with: Cursor

											
										
										
											2026-03-31 23:55:26 +08:00
+								                du = self._detect_user_stage(text_for_model)
-												refactor(agents): 抽取阶段常量与对话上下文；快档 LLM；图片 prompt 可禁止回退

访谈与阶段
- 新增 app/agents/stage_constants.py：集中 CHAT_STAGES、章节分类/顺序、阶段到默认 memoir 类别等，与 MemoirState 默认槽位顺序对齐；减少散落在 prompts 内的重复常量。
- 新增 app/agents/chat/prompt_context.py：以 ChatPromptContext 汇总 guided 系统提示所需字段（阶段、槽位、轮次、人设、记忆证据、回复长度模式、背景声线、职业等），统一走 get_guided_conversation_prompt。
- 大幅收敛 app/agents/chat/prompts_conversation.py；调整 prompts.py、stage_prompts.py、stage_detection.py；同步 interview_agent、profile_agent、helpers 与 state_schema，使对话侧构造提示的方式一致、可测。

回忆录流水线
- memoir/prompts.py 删除已迁至 stage_constants / 独立模板的大段常量与图片占位相关逻辑；classification / extraction / fidelity / narrative agents 与 orchest（全量历史仍可用于计数，注入模型时按轮次与字符上限截断）、image_prompt_fallback_disabled。
- dependencies 增加 get_llm_provider_fast（LRU 缓存，可与默认共用密钥与 base_url）。

任务与编排
- memoir_tasks：prepare_batches 注入 llm_fast；开启独立快档模型时打结构化日志。
- chapter_cover_tasks、story_image_tasks：与图片 prompt / JSON 工具路径或策略变更对齐（import 与行为一致）。
- story_pipeline_sync 等小处同步。

其它核心
- langchain_llm、text_normalize 随上述调用链微调。

开发者体验
- .cursor/settings.json：启用 redis-development、postman 插件。

测试
- 新增 test_image_prompt_policy：覆盖「禁止回退」等图片 prompt 策略。
- 更新 test_interview_prompts、test_interview_reply_length、test_experience_regressions、test_json_and_memory_utils，匹配新常量位置、json_utils 与对话/长度行为。

											
										
										
											2026-04-02 12:00:00 +08:00
+								            hw = await get_history_with_window(
 								                conversation_id,
 								                max_pairs=settings.chat_history_max_pairs,
 								                max_chars=settings.chat_history_max_chars,
-												feat & refactor: 重构agents目录结构；AI回复模块agent结构封装

											
										
										
											2026-03-19 10:36:55 +08:00
+								            )
-												refactor(eval+memoir)：精简内部评测路由与服务，composite/对话摘要与 judge 能力补强

- 访谈：新增 interview_state_hints，联动 orchestrator 与提示词
- 回忆录：story_pipeline_sync/state/memory/post_commit 与 Celery 任务调整
- 基建：开发用 celery broker、compose/development 脚本、依赖注入
- eval-web：移除数据集/实验/版本等页面与流式轮询，突出 Playground
- 文档与单测同步

											
										
										
											2026-04-08 21:36:12 +08:00
+								            recent_questions = extract_recent_questions(hw.window)
-												refactor(agents): 抽取阶段常量与对话上下文；快档 LLM；图片 prompt 可禁止回退

访谈与阶段
- 新增 app/agents/stage_constants.py：集中 CHAT_STAGES、章节分类/顺序、阶段到默认 memoir 类别等，与 MemoirState 默认槽位顺序对齐；减少散落在 prompts 内的重复常量。
- 新增 app/agents/chat/prompt_context.py：以 ChatPromptContext 汇总 guided 系统提示所需字段（阶段、槽位、轮次、人设、记忆证据、回复长度模式、背景声线、职业等），统一走 get_guided_conversation_prompt。
- 大幅收敛 app/agents/chat/prompts_conversation.py；调整 prompts.py、stage_prompts.py、stage_detection.py；同步 interview_agent、profile_agent、helpers 与 state_schema，使对话侧构造提示的方式一致、可测。

回忆录流水线
- memoir/prompts.py 删除已迁至 stage_constants / 独立模板的大段常量与图片占位相关逻辑；classification / extraction / fidelity / narrative agents 与 orchest（全量历史仍可用于计数，注入模型时按轮次与字符上限截断）、image_prompt_fallback_disabled。
- dependencies 增加 get_llm_provider_fast（LRU 缓存，可与默认共用密钥与 base_url）。

任务与编排
- memoir_tasks：prepare_batches 注入 llm_fast；开启独立快档模型时打结构化日志。
- chapter_cover_tasks、story_image_tasks：与图片 prompt / JSON 工具路径或策略变更对齐（import 与行为一致）。
- story_pipeline_sync 等小处同步。

其它核心
- langchain_llm、text_normalize 随上述调用链微调。

开发者体验
- .cursor/settings.json：启用 redis-development、postman 插件。

测试
- 新增 test_image_prompt_policy：覆盖「禁止回退」等图片 prompt 策略。
- 更新 test_interview_prompts、test_interview_reply_length、test_experience_regressions、test_json_and_memory_utils，匹配新常量位置、json_utils 与对话/长度行为。

											
										
										
											2026-04-02 12:00:00 +08:00
+								            conversation_turn_total = hw.turn_total
-												feat(api)!: memory single chain — async MemoryService, strict eval closure

Route all memory ingest/retrieve/enrichment/compaction through async MemoryService.
Remove legacy sync memory implementations (ingest/retrieve/compaction); Celery and
memoir Phase2 call asyncio.run into MemoryService-backed helpers.

Memoir Phase1 batch ingest uses MemoryService.ingest_transcripts_batch; drop chapters.
evidence_bundle_json mirror (Alembic 0015). Evaluation uses snapshot/link-only bundles;
raise EvidenceClosureMissing instead of partial/fallback lineage tiers.

Split memoir state into NarrativeCoverageState and InterviewControlState; delete the
_interview_meta_store adapter layer. Remove rolling-query and recent-fact fallback
settings from config and evidence assembly.

Update judges, docs, tests, and PlaygroundPage alignment.

Made-with: Cursor

											
										
										
											2026-04-30 14:11:46 +08:00
+								            all_stages_coverage = narrative_state.all_stages_coverage()
-												feat(api): 访谈人格/回复长度策略、口述归一、背景语气与输入净稿全链路

Chat 访谈
- 新增 persona 系统（default / warm_listener / curious_guide）与 background_voice 语气层
- 回复长度由 compute_reply_plan 统一决策（brief / standard / expanded），融合信息密度启发式
- 输入净稿（input_normalize）：编排层可选 rules/llm 归一用户口语后再喂模型与记忆检索
- 记忆证据注入：按用户话检索 memory evidence 并注入 prompt

Memoir 回忆录
- 口述归一（oral_normalize）：segment 原文保留，story 管线取派生净稿作叙事输入
- segment 入队批次门闸：累计字数 + 最长等待秒数，减少零碎提交
- fidelity_check / prompts / narrative_agent 微调
- Alembic 0005：清理跨章节 story 外键

Infra
- Dockerfile 加入 ffmpeg
- pyproject.toml 新增依赖并同步 uv.lock
- .env.example / .env.production 补全新配置项

Tests
- 新增 test_background_voice、test_chat_input_normalize、test_experience_regressions
- 扩展 test_interview_prompts、test_interview_reply_length、test_story_route_oral_invariant

Made-with: Cursor

											
										
										
											2026-03-31 23:55:26 +08:00
+								            persona = normalize_interview_persona(settings.chat_interview_persona)
-												refactor(chat): AI-native prompts, remove interview heuristics

- Drop interview_reply_length and utterance_substance; always run stage LLM
  and memory retrieval when enabled; trim Settings fields and .env.example.
- Replace guided/opening prompts with compact fact blocks plus unified
  behavior guidance; slim background_voice and persona to tone hints.
- InterviewAgent uses fixed chat_interview max_tokens/chars/segments.

Also includes stacked work: profile followup/extract path, evaluation rubric
and judge schema updates, transcript SPLIT handling in execution service,
user export markdown split tests, and golden case fixture.

											
										
										
											2026-04-06 22:22:50 +08:00
+								            max_segments = int(settings.chat_interview_max_segments)
 								            max_tokens = int(settings.chat_interview_max_tokens)
 								            max_chars = int(settings.chat_interview_max_chars_per_segment)
-												feat(chat): server-side interview turn plan (mode, anchor slot, snippet)

- Add plan_interview_turn: emotion_first / memoir_push / follow_user_only
- Inject hard directive block at top of guided system prompt
- Pass stage_switched_this_turn from ChatOrchestrator after stage detection
- Log interview_turn_plan for observability; add unit tests

											
										
										
											2026-04-10 13:56:44 +08:00
+								            turn_plan = plan_interview_turn(
 								                current_stage=memoir_state.current_stage,
 								                empty_slots=empty_slots,
 								                normalized_user_message=text_for_model,
-												WIP: memory system improvements (in progress)

Interview/chat prompt layers, reply planner, style profiles, memory
injection, interview meta store, and related tests. Work not finished.

Made-with: Cursor

											
										
										
											2026-04-22 16:56:28 +08:00
+								                memory_evidence_text=(memory_anchor_source or "").strip(),
-												feat(chat): server-side interview turn plan (mode, anchor slot, snippet)

- Add plan_interview_turn: emotion_first / memoir_push / follow_user_only
- Inject hard directive block at top of guided system prompt
- Pass stage_switched_this_turn from ChatOrchestrator after stage detection
- Log interview_turn_plan for observability; add unit tests

											
										
										
											2026-04-10 13:56:44 +08:00
+								                stage_switched_this_turn=stage_switched_this_turn,
 								            )
 								            logger.info(
 								                "event=interview_turn_plan mode={} anchor_slot={} snippet_len={}",
 								                turn_plan.mode,
 								                turn_plan.anchor_slot_key or "-",
 								                len(turn_plan.anchor_snippet or ""),
 								            )
-												WIP: memory system improvements (in progress)

Interview/chat prompt layers, reply planner, style profiles, memory
injection, interview meta store, and related tests. Work not finished.

Made-with: Cursor

											
										
										
											2026-04-22 16:56:28 +08:00
+								            reply_planner_raw = ""
 								            baseline_mode = turn_plan.mode
 								            baseline_primary_focus = turn_plan.primary_focus
 								            if settings.chat_reply_planner_llm_enabled:
 								                rq_preview = (
 								                    "\n".join(recent_questions[-4:])
 								                    if recent_questions
 								                    else ""
 								                )
 								                turn_plan, reply_planner_raw = await maybe_refine_turn_plan_with_llm(
 								                    self.llm,
 								                    plan=turn_plan,
 								                    text_for_model=text_for_model,
 								                    memory_evidence_text=(memory_planner_text or memory_evidence_text)
 								                    or "",
 								                    max_tokens=int(settings.chat_reply_planner_max_tokens),
 								                    temperature=float(settings.chat_reply_planner_temperature),
 								                    scene_cues_for_planner=scene_cues_for_planner or [],
 								                    recent_questions_preview=rq_preview,
 								                )
 								                if reply_planner_raw:
 								                    logger.info(
 								                        "event=reply_planner_applied memory_usage={} reply_shape={} "
 								                        "mode={} primary_focus={} focus_source={}",
 								                        turn_plan.memory_usage,
 								                        turn_plan.reply_shape,
 								                        turn_plan.mode,
 								                        turn_plan.primary_focus,
 								                        turn_plan.focus_source,
 								                    )
-												refactor(agents): 抽取阶段常量与对话上下文；快档 LLM；图片 prompt 可禁止回退

访谈与阶段
- 新增 app/agents/stage_constants.py：集中 CHAT_STAGES、章节分类/顺序、阶段到默认 memoir 类别等，与 MemoirState 默认槽位顺序对齐；减少散落在 prompts 内的重复常量。
- 新增 app/agents/chat/prompt_context.py：以 ChatPromptContext 汇总 guided 系统提示所需字段（阶段、槽位、轮次、人设、记忆证据、回复长度模式、背景声线、职业等），统一走 get_guided_conversation_prompt。
- 大幅收敛 app/agents/chat/prompts_conversation.py；调整 prompts.py、stage_prompts.py、stage_detection.py；同步 interview_agent、profile_agent、helpers 与 state_schema，使对话侧构造提示的方式一致、可测。

回忆录流水线
- memoir/prompts.py 删除已迁至 stage_constants / 独立模板的大段常量与图片占位相关逻辑；classification / extraction / fidelity / narrative agents 与 orchest（全量历史仍可用于计数，注入模型时按轮次与字符上限截断）、image_prompt_fallback_disabled。
- dependencies 增加 get_llm_provider_fast（LRU 缓存，可与默认共用密钥与 base_url）。

任务与编排
- memoir_tasks：prepare_batches 注入 llm_fast；开启独立快档模型时打结构化日志。
- chapter_cover_tasks、story_image_tasks：与图片 prompt / JSON 工具路径或策略变更对齐（import 与行为一致）。
- story_pipeline_sync 等小处同步。

其它核心
- langchain_llm、text_normalize 随上述调用链微调。

开发者体验
- .cursor/settings.json：启用 redis-development、postman 插件。

测试
- 新增 test_image_prompt_policy：覆盖「禁止回退」等图片 prompt 策略。
- 更新 test_interview_prompts、test_interview_reply_length、test_experience_regressions、test_json_and_memory_utils，匹配新常量位置、json_utils 与对话/长度行为。

											
										
										
											2026-04-02 12:00:00 +08:00
+								            ctx = ChatPromptContext(
-												feat & refactor: 重构agents目录结构；AI回复模块agent结构封装

											
										
										
											2026-03-19 10:36:55 +08:00
+								                current_stage=memoir_state.current_stage,
 								                empty_slots=empty_slots,
 								                filled_slots=filled_slots,
 								                all_stages_coverage=all_stages_coverage,
-												feat(api+app): 对话阶段化、回忆录流水线与客户端会话体验
- DB: segments 用户输入文本（Alembic 0002）
- Chat: 阶段检测/阶段提示/回复限制，编排与访谈/画像 prompts 调整
- Memoir: 忠实度检查 agent，叙事与分类等链路更新
- Core: agent 日志、Alembic 启动、LangChain/日志/配置等
- Story: time_hints；Memory 检索与相关测试
- Expo: 助手头像、会话页与消息拆分、实时会话与文案/i18n
- Docs/scripts/tests: 迁移脚本、LLM JSON/记忆检索文档、新增单测

											
										
										
											2026-03-26 12:13:36 +08:00
+								                detected_user_stage=du,
-												feat & refactor: 重构agents目录结构；AI回复模块agent结构封装

											
										
										
											2026-03-19 10:36:55 +08:00
+								                user_profile_context=user_profile_context,
-												feat(api): 访谈人格/回复长度策略、口述归一、背景语气与输入净稿全链路

Chat 访谈
- 新增 persona 系统（default / warm_listener / curious_guide）与 background_voice 语气层
- 回复长度由 compute_reply_plan 统一决策（brief / standard / expanded），融合信息密度启发式
- 输入净稿（input_normalize）：编排层可选 rules/llm 归一用户口语后再喂模型与记忆检索
- 记忆证据注入：按用户话检索 memory evidence 并注入 prompt

Memoir 回忆录
- 口述归一（oral_normalize）：segment 原文保留，story 管线取派生净稿作叙事输入
- segment 入队批次门闸：累计字数 + 最长等待秒数，减少零碎提交
- fidelity_check / prompts / narrative_agent 微调
- Alembic 0005：清理跨章节 story 外键

Infra
- Dockerfile 加入 ffmpeg
- pyproject.toml 新增依赖并同步 uv.lock
- .env.example / .env.production 补全新配置项

Tests
- 新增 test_background_voice、test_chat_input_normalize、test_experience_regressions
- 扩展 test_interview_prompts、test_interview_reply_length、test_story_route_oral_invariant

Made-with: Cursor

											
										
										
											2026-03-31 23:55:26 +08:00
+								                persona=persona,
 								                memory_evidence_text=memory_evidence_text,
 								                background_voice=background_voice,
-												feat(api): 叙事 prompt、职业上下文、读路径章节、WS 解耦与错误脱敏

- 回忆录：事实边界补充允许清单；传记文体示例与 JSON 叙事要求对齐
- default 职业提示 occupation_context；cadre/military 退休语境
- GET 章节读路径零写入，prepare_chapter_read_view + markdown_for_response
- 文本归一抽到 core/text_normalize；移除弃用 reply 策略与 recompose_chapters_for_story
- ConversationService：WS 连接/用户段落/结束对话；对外错误固定文案
- 测试：HTTP 脱敏契约、章节读视图、occupation 与 background_voice

											
										
										
											2026-04-01 11:49:33 +08:00
+								                occupation=occupation,
-												feat: 回忆录证据血缘与内部评测可追溯，顺带对齐本地评测台与 CI

数据库与模型：新增多版迁移（章节证据快照、对话血缘、记忆事实/时间线 lineage 等），把「成稿 ↔ 对话/记忆」的溯源信息落到表结构里。
业务链路：会话与 WS、回忆录/故事流水线、记忆写入与 enrichment 等跟着接上线索与快照；新增章节证据快照与评测侧 EvalTraceService 等模块，方便组评审用的证据包。
内部评测：自动化 run 与手工 memoir 评审共用可追溯证据；rubric/ judge 相关脚本与文档有配套调整。
app-eval-web：Memoir/实验详情里能展开看证据摘要与 evidence_trace（含对话轮次 id）；Vite 代理与 development.sh 注入的 API 端口与当前默认内部评测端口一致，避免改端口后页面连错服务。
工程杂项：GitHub Actions / 仓库说明有更新；各适配器与支付/配额/plan 等多处为小改动或跟随主改动的收尾；新增/扩充了……（提交说明在此处被截断）

											
										
										
											2026-04-08 15:37:09 +08:00
+								                profile_birth_year=profile_birth_year,
 								                profile_era_place=profile_era_place,
-												refactor(eval+memoir)：精简内部评测路由与服务，composite/对话摘要与 judge 能力补强

- 访谈：新增 interview_state_hints，联动 orchestrator 与提示词
- 回忆录：story_pipeline_sync/state/memory/post_commit 与 Celery 任务调整
- 基建：开发用 celery broker、compose/development 脚本、依赖注入
- eval-web：移除数据集/实验/版本等页面与流式轮询，突出 Playground
- 文档与单测同步

											
										
										
											2026-04-08 21:36:12 +08:00
+								                known_facts=memoir_state.known_facts,
 								                persona_threads=memoir_state.persona_threads,
 								                recent_questions=recent_questions or memoir_state.recent_questions,
-												feat(chat): server-side interview turn plan (mode, anchor slot, snippet)

- Add plan_interview_turn: emotion_first / memoir_push / follow_user_only
- Inject hard directive block at top of guided system prompt
- Pass stage_switched_this_turn from ChatOrchestrator after stage detection
- Log interview_turn_plan for observability; add unit tests

											
										
										
											2026-04-10 13:56:44 +08:00
+								                turn_plan=turn_plan,
-												feat & refactor: 重构agents目录结构；AI回复模块agent结构封装

											
										
										
											2026-03-19 10:36:55 +08:00
+								            )
-												refactor(agents): 抽取阶段常量与对话上下文；快档 LLM；图片 prompt 可禁止回退

访谈与阶段
- 新增 app/agents/stage_constants.py：集中 CHAT_STAGES、章节分类/顺序、阶段到默认 memoir 类别等，与 MemoirState 默认槽位顺序对齐；减少散落在 prompts 内的重复常量。
- 新增 app/agents/chat/prompt_context.py：以 ChatPromptContext 汇总 guided 系统提示所需字段（阶段、槽位、轮次、人设、记忆证据、回复长度模式、背景声线、职业等），统一走 get_guided_conversation_prompt。
- 大幅收敛 app/agents/chat/prompts_conversation.py；调整 prompts.py、stage_prompts.py、stage_detection.py；同步 interview_agent、profile_agent、helpers 与 state_schema，使对话侧构造提示的方式一致、可测。

回忆录流水线
- memoir/prompts.py 删除已迁至 stage_constants / 独立模板的大段常量与图片占位相关逻辑；classification / extraction / fidelity / narrative agents 与 orchest（全量历史仍可用于计数，注入模型时按轮次与字符上限截断）、image_prompt_fallback_disabled。
- dependencies 增加 get_llm_provider_fast（LRU 缓存，可与默认共用密钥与 base_url）。

任务与编排
- memoir_tasks：prepare_batches 注入 llm_fast；开启独立快档模型时打结构化日志。
- chapter_cover_tasks、story_image_tasks：与图片 prompt / JSON 工具路径或策略变更对齐（import 与行为一致）。
- story_pipeline_sync 等小处同步。

其它核心
- langchain_llm、text_normalize 随上述调用链微调。

开发者体验
- .cursor/settings.json：启用 redis-development、postman 插件。

测试
- 新增 test_image_prompt_policy：覆盖「禁止回退」等图片 prompt 策略。
- 更新 test_interview_prompts、test_interview_reply_length、test_experience_regressions、test_json_and_memory_utils，匹配新常量位置、json_utils 与对话/长度行为。

											
										
										
											2026-04-02 12:00:00 +08:00
+								            system_prompt = ctx.guided_system_prompt()
 								            messages: List[Any] = [SystemMessage(content=system_prompt)]
 								            messages.extend(hw.window)
 								            messages.append(HumanMessage(content=text_for_model))
 								            history_pairs_windowed = len(hw.window) // 2
 								            window_chars = sum(len(getattr(m, "content", "") or "") for m in hw.window)
 								            logger.info(
 								                "event=history_window_applied total={} windowed={} chars={}",
 								                conversation_turn_total,
 								                history_pairs_windowed,
 								                window_chars,
 								            )
-												feat(api+app): 对话阶段化、回忆录流水线与客户端会话体验
- DB: segments 用户输入文本（Alembic 0002）
- Chat: 阶段检测/阶段提示/回复限制，编排与访谈/画像 prompts 调整
- Memoir: 忠实度检查 agent，叙事与分类等链路更新
- Core: agent 日志、Alembic 启动、LangChain/日志/配置等
- Story: time_hints；Memory 检索与相关测试
- Expo: 助手头像、会话页与消息拆分、实时会话与文案/i18n
- Docs/scripts/tests: 迁移脚本、LLM JSON/记忆检索文档、新增单测

											
										
										
											2026-03-26 12:13:36 +08:00
+								            log_agent_payload(
-												refactor(agents): 抽取阶段常量与对话上下文；快档 LLM；图片 prompt 可禁止回退

访谈与阶段
- 新增 app/agents/stage_constants.py：集中 CHAT_STAGES、章节分类/顺序、阶段到默认 memoir 类别等，与 MemoirState 默认槽位顺序对齐；减少散落在 prompts 内的重复常量。
- 新增 app/agents/chat/prompt_context.py：以 ChatPromptContext 汇总 guided 系统提示所需字段（阶段、槽位、轮次、人设、记忆证据、回复长度模式、背景声线、职业等），统一走 get_guided_conversation_prompt。
- 大幅收敛 app/agents/chat/prompts_conversation.py；调整 prompts.py、stage_prompts.py、stage_detection.py；同步 interview_agent、profile_agent、helpers 与 state_schema，使对话侧构造提示的方式一致、可测。

回忆录流水线
- memoir/prompts.py 删除已迁至 stage_constants / 独立模板的大段常量与图片占位相关逻辑；classification / extraction / fidelity / narrative agents 与 orchest（全量历史仍可用于计数，注入模型时按轮次与字符上限截断）、image_prompt_fallback_disabled。
- dependencies 增加 get_llm_provider_fast（LRU 缓存，可与默认共用密钥与 base_url）。

任务与编排
- memoir_tasks：prepare_batches 注入 llm_fast；开启独立快档模型时打结构化日志。
- chapter_cover_tasks、story_image_tasks：与图片 prompt / JSON 工具路径或策略变更对齐（import 与行为一致）。
- story_pipeline_sync 等小处同步。

其它核心
- langchain_llm、text_normalize 随上述调用链微调。

开发者体验
- .cursor/settings.json：启用 redis-development、postman 插件。

测试
- 新增 test_image_prompt_policy：覆盖「禁止回退」等图片 prompt 策略。
- 更新 test_interview_prompts、test_interview_reply_length、test_experience_regressions、test_json_and_memory_utils，匹配新常量位置、json_utils 与对话/长度行为。

											
										
										
											2026-04-02 12:00:00 +08:00
+								                logger,
 								                "InterviewAgent.generate_response.prompt",
-												chore/ 精简展示AI活动的日志

											
										
										
											2026-04-03 13:49:24 +08:00
+								                format_history_string(
 								                    messages,
 								                    omit_system_body=settings.agent_log_omit_system_message_body,
 								                ),
-												feat(api+app): 对话阶段化、回忆录流水线与客户端会话体验
- DB: segments 用户输入文本（Alembic 0002）
- Chat: 阶段检测/阶段提示/回复限制，编排与访谈/画像 prompts 调整
- Memoir: 忠实度检查 agent，叙事与分类等链路更新
- Core: agent 日志、Alembic 启动、LangChain/日志/配置等
- Story: time_hints；Memory 检索与相关测试
- Expo: 助手头像、会话页与消息拆分、实时会话与文案/i18n
- Docs/scripts/tests: 迁移脚本、LLM JSON/记忆检索文档、新增单测

											
										
										
											2026-03-26 12:13:36 +08:00
+								            )
-												feat:
1. 建立问题库大纲，对应每个人生阶段槽位
2. 鼓励使用更生活化的交流语言共情与总结
3. 降低评审模型可能发生截断的概率
4. 成稿质量维度强化情感表达和上下文连贯性

											
										
										
											2026-04-09 15:32:35 +08:00
+								            chat_llm = self.llm.bind(
 								                max_tokens=max_tokens,
 								                temperature=float(settings.chat_interview_temperature),
 								            )
-												refactor(agents): 抽取阶段常量与对话上下文；快档 LLM；图片 prompt 可禁止回退

访谈与阶段
- 新增 app/agents/stage_constants.py：集中 CHAT_STAGES、章节分类/顺序、阶段到默认 memoir 类别等，与 MemoirState 默认槽位顺序对齐；减少散落在 prompts 内的重复常量。
- 新增 app/agents/chat/prompt_context.py：以 ChatPromptContext 汇总 guided 系统提示所需字段（阶段、槽位、轮次、人设、记忆证据、回复长度模式、背景声线、职业等），统一走 get_guided_conversation_prompt。
- 大幅收敛 app/agents/chat/prompts_conversation.py；调整 prompts.py、stage_prompts.py、stage_detection.py；同步 interview_agent、profile_agent、helpers 与 state_schema，使对话侧构造提示的方式一致、可测。

回忆录流水线
- memoir/prompts.py 删除已迁至 stage_constants / 独立模板的大段常量与图片占位相关逻辑；classification / extraction / fidelity / narrative agents 与 orchest（全量历史仍可用于计数，注入模型时按轮次与字符上限截断）、image_prompt_fallback_disabled。
- dependencies 增加 get_llm_provider_fast（LRU 缓存，可与默认共用密钥与 base_url）。

任务与编排
- memoir_tasks：prepare_batches 注入 llm_fast；开启独立快档模型时打结构化日志。
- chapter_cover_tasks、story_image_tasks：与图片 prompt / JSON 工具路径或策略变更对齐（import 与行为一致）。
- story_pipeline_sync 等小处同步。

其它核心
- langchain_llm、text_normalize 随上述调用链微调。

开发者体验
- .cursor/settings.json：启用 redis-development、postman 插件。

测试
- 新增 test_image_prompt_policy：覆盖「禁止回退」等图片 prompt 策略。
- 更新 test_interview_prompts、test_interview_reply_length、test_experience_regressions、test_json_and_memory_utils，匹配新常量位置、json_utils 与对话/长度行为。

											
										
										
											2026-04-02 12:00:00 +08:00
+								            prompt_chars = _message_contents_char_count(messages)
 								            llm_t0 = time.perf_counter()
-												feat(api+app): 对话阶段化、回忆录流水线与客户端会话体验
- DB: segments 用户输入文本（Alembic 0002）
- Chat: 阶段检测/阶段提示/回复限制，编排与访谈/画像 prompts 调整
- Memoir: 忠实度检查 agent，叙事与分类等链路更新
- Core: agent 日志、Alembic 启动、LangChain/日志/配置等
- Story: time_hints；Memory 检索与相关测试
- Expo: 助手头像、会话页与消息拆分、实时会话与文案/i18n
- Docs/scripts/tests: 迁移脚本、LLM JSON/记忆检索文档、新增单测

											
										
										
											2026-03-26 12:13:36 +08:00
+								            with agent_span(
 								                logger,
 								                "InterviewAgent.generate_response.llm",
 								                conversation_id=conversation_id,
 								                stage=memoir_state.current_stage,
 								            ):
-												refactor(agents): 抽取阶段常量与对话上下文；快档 LLM；图片 prompt 可禁止回退

访谈与阶段
- 新增 app/agents/stage_constants.py：集中 CHAT_STAGES、章节分类/顺序、阶段到默认 memoir 类别等，与 MemoirState 默认槽位顺序对齐；减少散落在 prompts 内的重复常量。
- 新增 app/agents/chat/prompt_context.py：以 ChatPromptContext 汇总 guided 系统提示所需字段（阶段、槽位、轮次、人设、记忆证据、回复长度模式、背景声线、职业等），统一走 get_guided_conversation_prompt。
- 大幅收敛 app/agents/chat/prompts_conversation.py；调整 prompts.py、stage_prompts.py、stage_detection.py；同步 interview_agent、profile_agent、helpers 与 state_schema，使对话侧构造提示的方式一致、可测。

回忆录流水线
- memoir/prompts.py 删除已迁至 stage_constants / 独立模板的大段常量与图片占位相关逻辑；classification / extraction / fidelity / narrative agents 与 orchest（全量历史仍可用于计数，注入模型时按轮次与字符上限截断）、image_prompt_fallback_disabled。
- dependencies 增加 get_llm_provider_fast（LRU 缓存，可与默认共用密钥与 base_url）。

任务与编排
- memoir_tasks：prepare_batches 注入 llm_fast；开启独立快档模型时打结构化日志。
- chapter_cover_tasks、story_image_tasks：与图片 prompt / JSON 工具路径或策略变更对齐（import 与行为一致）。
- story_pipeline_sync 等小处同步。

其它核心
- langchain_llm、text_normalize 随上述调用链微调。

开发者体验
- .cursor/settings.json：启用 redis-development、postman 插件。

测试
- 新增 test_image_prompt_policy：覆盖「禁止回退」等图片 prompt 策略。
- 更新 test_interview_prompts、test_interview_reply_length、test_experience_regressions、test_json_and_memory_utils，匹配新常量位置、json_utils 与对话/长度行为。

											
										
										
											2026-04-02 12:00:00 +08:00
+								                logger.info(
 								                    "event=chat_prompt_built agent=InterviewAgent.generate_response_with_state "
 								                    "prompt_chars={} history_pairs_total={} history_pairs_windowed={}",
 								                    prompt_chars,
 								                    conversation_turn_total,
 								                    history_pairs_windowed,
 								                )
 								                response = await chat_llm.ainvoke(messages)
 								            response_ms = (time.perf_counter() - llm_t0) * 1000
 								            logger.info(
 								                "event=chat_llm_done agent=InterviewAgent.generate_response_with_state "
 								                "response_latency_ms={:.2f}",
 								                response_ms,
 								            )
-												chore/ 删除无用文件

											
										
										
											2026-03-19 14:36:14 +08:00
+								            response_text = (
 								                response.content if hasattr(response, "content") else str(response)
 								            )
-												feat(api+app): 对话阶段化、回忆录流水线与客户端会话体验
- DB: segments 用户输入文本（Alembic 0002）
- Chat: 阶段检测/阶段提示/回复限制，编排与访谈/画像 prompts 调整
- Memoir: 忠实度检查 agent，叙事与分类等链路更新
- Core: agent 日志、Alembic 启动、LangChain/日志/配置等
- Story: time_hints；Memory 检索与相关测试
- Expo: 助手头像、会话页与消息拆分、实时会话与文案/i18n
- Docs/scripts/tests: 迁移脚本、LLM JSON/记忆检索文档、新增单测

											
										
										
											2026-03-26 12:13:36 +08:00
+								            log_agent_payload(
 								                logger, "InterviewAgent.generate_response.raw_response", response_text
 								            )
-												fix(chat): 重复追问被拦截时再多问一次模型

防重复问句守卫把整段回复削成只剩「这一段我记住了。」这一句套话时，用带纠偏说明的 system 提示再调用一次 LLM，尽量避免用户只看到一句干巴巴的 ack。重试仅此一次，并打日志、在 meta 中标记 duplicate_question_guard_llm_retry。

											
										
										
											2026-04-10 15:33:28 +08:00
+								            rq_base = recent_questions or memoir_state.recent_questions
 								            out, deduped = _finalize_chat_segments_after_llm(
-												feat(memory,conversation): 记忆富化/证据包、时间线幂等字段与对话分段全链路

数据库
- 新增迁移 0003：timeline_events.memory_source_id 外键 → memory_sources，便于按 ingest 源做时间线幂等

后端 - 记忆
- 新增 ingest 后 LLM 富化（摘要/事实/时间线），可配置开关与最大字符数
- 新增证据包组装：合并 chunk、摘要、事实、时间线、故事等检索结果；支持空 query 时是否仍带 rolling 等开关
- repo/retriever/service/router/schemas/summarizer/timeline/extractor 等扩展；文档 memory-retrieval.md 更新

后端 - 对话 WS
- 增加 PING/PONG；分段 ASR 日志与空音频处理；转写失败与「无助手回复」错误提示更明确
- 助手多段回复持久化使用统一分隔符，与分段逻辑一致

后端 - Agent
- reply_limits：按 [SPLIT] 与段落拆段，并保证非空 fallback，供 WS 与 TTS 多段下发

后端 - 回忆录任务
- transcript ingest 记录 source_id；任务成功结……（提交说明在此处被截断）

											
										
										
											2026-03-27 16:01:28 +08:00
+								                response_text,
-												refactor(chat): AI-native prompts, remove interview heuristics

- Drop interview_reply_length and utterance_substance; always run stage LLM
  and memory retrieval when enabled; trim Settings fields and .env.example.
- Replace guided/opening prompts with compact fact blocks plus unified
  behavior guidance; slim background_voice and persona to tone hints.
- InterviewAgent uses fixed chat_interview max_tokens/chars/segments.

Also includes stacked work: profile followup/extract path, evaluation rubric
and judge schema updates, transcript SPLIT handling in execution service,
user export markdown split tests, and golden case fixture.

											
										
										
											2026-04-06 22:22:50 +08:00
+								                max_segments=max_segments,
-												fix(chat): 重复追问被拦截时再多问一次模型

防重复问句守卫把整段回复削成只剩「这一段我记住了。」这一句套话时，用带纠偏说明的 system 提示再调用一次 LLM，尽量避免用户只看到一句干巴巴的 ack。重试仅此一次，并打日志、在 meta 中标记 duplicate_question_guard_llm_retry。

											
										
										
											2026-04-10 15:33:28 +08:00
+								                max_chars=max_chars,
 								                memoir_state=memoir_state,
 								                recent_questions=rq_base,
-												feat(memory,conversation): 记忆富化/证据包、时间线幂等字段与对话分段全链路

数据库
- 新增迁移 0003：timeline_events.memory_source_id 外键 → memory_sources，便于按 ingest 源做时间线幂等

后端 - 记忆
- 新增 ingest 后 LLM 富化（摘要/事实/时间线），可配置开关与最大字符数
- 新增证据包组装：合并 chunk、摘要、事实、时间线、故事等检索结果；支持空 query 时是否仍带 rolling 等开关
- repo/retriever/service/router/schemas/summarizer/timeline/extractor 等扩展；文档 memory-retrieval.md 更新

后端 - 对话 WS
- 增加 PING/PONG；分段 ASR 日志与空音频处理；转写失败与「无助手回复」错误提示更明确
- 助手多段回复持久化使用统一分隔符，与分段逻辑一致

后端 - Agent
- reply_limits：按 [SPLIT] 与段落拆段，并保证非空 fallback，供 WS 与 TTS 多段下发

后端 - 回忆录任务
- transcript ingest 记录 source_id；任务成功结……（提交说明在此处被截断）

											
										
										
											2026-03-27 16:01:28 +08:00
+								            )
-												fix(chat): 重复追问被拦截时再多问一次模型

防重复问句守卫把整段回复削成只剩「这一段我记住了。」这一句套话时，用带纠偏说明的 system 提示再调用一次 LLM，尽量避免用户只看到一句干巴巴的 ack。重试仅此一次，并打日志、在 meta 中标记 duplicate_question_guard_llm_retry。

											
										
										
											2026-04-10 15:33:28 +08:00
+								            retry_used = False
 								            if deduped and segments_are_only_duplicate_guard_fallback(out):
 								                retry_system = (
 								                    f"{system_prompt}\n\n{_DUPLICATE_GUARD_LLM_RETRY_SYSTEM_APPENDIX}"
 								                )
 								                retry_messages: List[Any] = [
 								                    SystemMessage(content=retry_system),
 								                    *hw.window,
 								                    HumanMessage(content=text_for_model),
 								                ]
 								                log_agent_payload(
 								                    logger,
 								                    "InterviewAgent.generate_response.retry_prompt",
 								                    format_history_string(
 								                        retry_messages,
 								                        omit_system_body=settings.agent_log_omit_system_message_body,
 								                    ),
 								                )
 								                llm_t1 = time.perf_counter()
 								                with agent_span(
 								                    logger,
 								                    "InterviewAgent.generate_response.llm_retry",
 								                    conversation_id=conversation_id,
 								                    stage=memoir_state.current_stage,
 								                ):
 								                    logger.info(
 								                        "event=chat_prompt_built agent=InterviewAgent.duplicate_guard_retry "
 								                        "prompt_chars={} conversation_id={}",
 								                        _message_contents_char_count(retry_messages),
 								                        conversation_id,
 								                    )
 								                    response_retry = await chat_llm.ainvoke(retry_messages)
 								                logger.info(
 								                    "event=chat_llm_done agent=InterviewAgent.duplicate_guard_retry "
 								                    "response_latency_ms={:.2f}",
 								                    (time.perf_counter() - llm_t1) * 1000,
 								                )
 								                response_text_retry = (
 								                    response_retry.content
 								                    if hasattr(response_retry, "content")
 								                    else str(response_retry)
 								                )
 								                log_agent_payload(
 								                    logger,
 								                    "InterviewAgent.generate_response.raw_response_retry",
 								                    response_text_retry,
 								                )
 								                out, deduped = _finalize_chat_segments_after_llm(
 								                    response_text_retry,
 								                    max_segments=max_segments,
 								                    max_chars=max_chars,
 								                    memoir_state=memoir_state,
 								                    recent_questions=rq_base,
 								                )
 								                retry_used = True
-												WIP: memory system improvements (in progress)

Interview/chat prompt layers, reply planner, style profiles, memory
injection, interview meta store, and related tests. Work not finished.

Made-with: Cursor

											
										
										
											2026-04-22 16:56:28 +08:00
+								            out, auto_bio = apply_autobiographical_boundary_guard(out)
-												fix(chat): 重复追问被拦截时再多问一次模型

防重复问句守卫把整段回复削成只剩「这一段我记住了。」这一句套话时，用带纠偏说明的 system 提示再调用一次 LLM，尽量避免用户只看到一句干巴巴的 ack。重试仅此一次，并打日志、在 meta 中标记 duplicate_question_guard_llm_retry。

											
										
										
											2026-04-10 15:33:28 +08:00
+								            updated_recent_questions = update_recent_questions(rq_base, out)
-												feat(api+app): 对话阶段化、回忆录流水线与客户端会话体验
- DB: segments 用户输入文本（Alembic 0002）
- Chat: 阶段检测/阶段提示/回复限制，编排与访谈/画像 prompts 调整
- Memoir: 忠实度检查 agent，叙事与分类等链路更新
- Core: agent 日志、Alembic 启动、LangChain/日志/配置等
- Story: time_hints；Memory 检索与相关测试
- Expo: 助手头像、会话页与消息拆分、实时会话与文案/i18n
- Docs/scripts/tests: 迁移脚本、LLM JSON/记忆检索文档、新增单测

											
										
										
											2026-03-26 12:13:36 +08:00
+								            log_agent_summary(
 								                logger,
-												feat(api): 访谈人格/回复长度策略、口述归一、背景语气与输入净稿全链路

Chat 访谈
- 新增 persona 系统（default / warm_listener / curious_guide）与 background_voice 语气层
- 回复长度由 compute_reply_plan 统一决策（brief / standard / expanded），融合信息密度启发式
- 输入净稿（input_normalize）：编排层可选 rules/llm 归一用户口语后再喂模型与记忆检索
- 记忆证据注入：按用户话检索 memory evidence 并注入 prompt

Memoir 回忆录
- 口述归一（oral_normalize）：segment 原文保留，story 管线取派生净稿作叙事输入
- segment 入队批次门闸：累计字数 + 最长等待秒数，减少零碎提交
- fidelity_check / prompts / narrative_agent 微调
- Alembic 0005：清理跨章节 story 外键

Infra
- Dockerfile 加入 ffmpeg
- pyproject.toml 新增依赖并同步 uv.lock
- .env.example / .env.production 补全新配置项

Tests
- 新增 test_background_voice、test_chat_input_normalize、test_experience_regressions
- 扩展 test_interview_prompts、test_interview_reply_length、test_story_route_oral_invariant

Made-with: Cursor

											
										
										
											2026-03-31 23:55:26 +08:00
+								                "InterviewAgent.generate_response segments={} conversation_id={} "
-												refactor(chat): AI-native prompts, remove interview heuristics

- Drop interview_reply_length and utterance_substance; always run stage LLM
  and memory retrieval when enabled; trim Settings fields and .env.example.
- Replace guided/opening prompts with compact fact blocks plus unified
  behavior guidance; slim background_voice and persona to tone hints.
- InterviewAgent uses fixed chat_interview max_tokens/chars/segments.

Also includes stacked work: profile followup/extract path, evaluation rubric
and judge schema updates, transcript SPLIT handling in execution service,
user export markdown split tests, and golden case fixture.

											
										
										
											2026-04-06 22:22:50 +08:00
+								                "max_tokens={}",
-												feat(api+app): 对话阶段化、回忆录流水线与客户端会话体验
- DB: segments 用户输入文本（Alembic 0002）
- Chat: 阶段检测/阶段提示/回复限制，编排与访谈/画像 prompts 调整
- Memoir: 忠实度检查 agent，叙事与分类等链路更新
- Core: agent 日志、Alembic 启动、LangChain/日志/配置等
- Story: time_hints；Memory 检索与相关测试
- Expo: 助手头像、会话页与消息拆分、实时会话与文案/i18n
- Docs/scripts/tests: 迁移脚本、LLM JSON/记忆检索文档、新增单测

											
										
										
											2026-03-26 12:13:36 +08:00
+								                len(out),
 								                conversation_id,
-												refactor(chat): AI-native prompts, remove interview heuristics

- Drop interview_reply_length and utterance_substance; always run stage LLM
  and memory retrieval when enabled; trim Settings fields and .env.example.
- Replace guided/opening prompts with compact fact blocks plus unified
  behavior guidance; slim background_voice and persona to tone hints.
- InterviewAgent uses fixed chat_interview max_tokens/chars/segments.

Also includes stacked work: profile followup/extract path, evaluation rubric
and judge schema updates, transcript SPLIT handling in execution service,
user export markdown split tests, and golden case fixture.

											
										
										
											2026-04-06 22:22:50 +08:00
+								                max_tokens,
-												feat(api+app): 对话阶段化、回忆录流水线与客户端会话体验
- DB: segments 用户输入文本（Alembic 0002）
- Chat: 阶段检测/阶段提示/回复限制，编排与访谈/画像 prompts 调整
- Memoir: 忠实度检查 agent，叙事与分类等链路更新
- Core: agent 日志、Alembic 启动、LangChain/日志/配置等
- Story: time_hints；Memory 检索与相关测试
- Expo: 助手头像、会话页与消息拆分、实时会话与文案/i18n
- Docs/scripts/tests: 迁移脚本、LLM JSON/记忆检索文档、新增单测

											
										
										
											2026-03-26 12:13:36 +08:00
+								            )
-												refactor(eval+memoir)：精简内部评测路由与服务，composite/对话摘要与 judge 能力补强

- 访谈：新增 interview_state_hints，联动 orchestrator 与提示词
- 回忆录：story_pipeline_sync/state/memory/post_commit 与 Celery 任务调整
- 基建：开发用 celery broker、compose/development 脚本、依赖注入
- eval-web：移除数据集/实验/版本等页面与流式轮询，突出 Playground
- 文档与单测同步

											
										
										
											2026-04-08 21:36:12 +08:00
+								            return AgentChatTurn(
 								                messages=out,
 								                skip_tts=False,
 								                interview_state_meta={
 								                    "recent_questions": updated_recent_questions,
 								                    "duplicate_question_guard_triggered": deduped,
-												fix(chat): 重复追问被拦截时再多问一次模型

防重复问句守卫把整段回复削成只剩「这一段我记住了。」这一句套话时，用带纠偏说明的 system 提示再调用一次 LLM，尽量避免用户只看到一句干巴巴的 ack。重试仅此一次，并打日志、在 meta 中标记 duplicate_question_guard_llm_retry。

											
										
										
											2026-04-10 15:33:28 +08:00
+								                    "duplicate_question_guard_llm_retry": retry_used,
-												WIP: memory system improvements (in progress)

Interview/chat prompt layers, reply planner, style profiles, memory
injection, interview meta store, and related tests. Work not finished.

Made-with: Cursor

											
										
										
											2026-04-22 16:56:28 +08:00
+								                    "autobiographical_boundary_guard_triggered": auto_bio,
 								                    "reply_planner_llm_used": bool(
 								                        settings.chat_reply_planner_llm_enabled
 								                        and (reply_planner_raw or "").strip()
 								                    ),
 								                    "reply_planner_raw_preview": (reply_planner_raw or "")[:800],
 								                    "focus_planner_baseline_mode": baseline_mode,
 								                    "focus_planner_baseline_primary_focus": baseline_primary_focus,
 								                    "focus_planner_mode": turn_plan.mode,
 								                    "focus_planner_primary_focus": turn_plan.primary_focus,
 								                    "focus_planner_focus_source": turn_plan.focus_source,
 								                    "focus_planner_focus_summary": (turn_plan.focus_summary or "")[:200],
-												refactor(eval+memoir)：精简内部评测路由与服务，composite/对话摘要与 judge 能力补强

- 访谈：新增 interview_state_hints，联动 orchestrator 与提示词
- 回忆录：story_pipeline_sync/state/memory/post_commit 与 Celery 任务调整
- 基建：开发用 celery broker、compose/development 脚本、依赖注入
- eval-web：移除数据集/实验/版本等页面与流式轮询，突出 Playground
- 文档与单测同步

											
										
										
											2026-04-08 21:36:12 +08:00
+								                },
 								            )
-												feat & refactor: 重构agents目录结构；AI回复模块agent结构封装

											
										
										
											2026-03-19 10:36:55 +08:00
+								        except Exception as e:
-												feat(api+app): 对话阶段化、回忆录流水线与客户端会话体验
- DB: segments 用户输入文本（Alembic 0002）
- Chat: 阶段检测/阶段提示/回复限制，编排与访谈/画像 prompts 调整
- Memoir: 忠实度检查 agent，叙事与分类等链路更新
- Core: agent 日志、Alembic 启动、LangChain/日志/配置等
- Story: time_hints；Memory 检索与相关测试
- Expo: 助手头像、会话页与消息拆分、实时会话与文案/i18n
- Docs/scripts/tests: 迁移脚本、LLM JSON/记忆检索文档、新增单测

											
										
										
											2026-03-26 12:13:36 +08:00
+								            logger.error("生成回应失败: {}", e, exc_info=True)
-												修复一些已知问题

											
										
										
											2026-03-20 17:25:42 +08:00
+								            return AgentChatTurn(messages=[_FALLBACK_REPLY], skip_tts=True)
-												feat & refactor: 重构agents目录结构；AI回复模块agent结构封装

											
										
										
											2026-03-19 10:36:55 +08:00
 								    async def generate_opening_message(
 								        self,
 								        conversation_id: str,
 								        memoir_state: MemoirStateSchema,
 								        user_profile_context: str = "",
 								        background_voice: str = "default",
 								        occupation: str = "",
 								        profile_birth_year: Optional[int] = None,
 								        profile_era_place: str = "",
 								    ) -> List[str]:
 								        """Produce the opening line(s) for a conversation.

 								        Nothing is persisted here; per the original note, persistence is
 								        the Orchestrator's job.

 								        Args:
 								            conversation_id: Used to load the history window and to tag logs.
 								            memoir_state: Supplies the current stage and the narrative /
 								                interview-control sub-states used to pick empty slots.
 								            user_profile_context: Forwarded to the opening prompt builder.
 								            background_voice: Forwarded to the opening prompt builder.
 								            occupation: Forwarded to the opening prompt builder.
 								            profile_birth_year: Forwarded to the opening prompt builder.
 								            profile_era_place: Forwarded to the opening prompt builder.

 								        Returns:
 								            At most two reply segments. A fixed greeting is returned instead
 								            when no LLM is configured, when the processed reply is empty, or
 								            when any exception is raised along the way.
 								        """
 								        # Single source for the greeting used by all three fallback paths.
 								        fallback_opening = "你好呀～ 又见面了。今天想从人生里哪一小段回忆开始聊聊？"
 								        if not self.llm:
 								            return [fallback_opening]

 								        try:
 								            # Work out which slots of the current stage are still empty
 								            # and map them to their display names for the prompt.
 								            narrative_state = narrative_coverage_state(memoir_state)
 								            control_state = interview_control_state(memoir_state)
 								            pending_slots = control_state.prompt_empty_slots_for_stage(
 								                narrative_state, memoir_state.current_stage
 								            )
 								            readable_slots = [
 								                SLOT_NAME_MAP.get(slot, slot) for slot in pending_slots
 								            ]
 								            persona = normalize_interview_persona(settings.chat_interview_persona)
 								            prompt = get_opening_prompt(
 								                current_stage=memoir_state.current_stage,
 								                empty_slots_readable=readable_slots,
 								                user_profile_context=user_profile_context,
 								                persona=persona,
 								                background_voice=background_voice,
 								                occupation=occupation,
 								                profile_birth_year=profile_birth_year,
 								                profile_era_place=profile_era_place,
 								            )

 								            hw = await get_history_with_window(
 								                conversation_id,
 								                max_pairs=settings.chat_history_max_pairs,
 								                max_chars=settings.chat_history_max_chars,
 								            )
 								            # The trailing human turn differs depending on whether any
 								            # earlier history is being replayed to the model.
 								            nudge = (
 								                "（请根据上文，自然接续并说出你的开场白。）"
 								                if hw.window
 								                else "（对话刚开始，请自然地说出你的开场白。）"
 								            )
 								            messages: List[Any] = [
 								                SystemMessage(content=prompt),
 								                *hw.window,
 								                HumanMessage(content=nudge),
 								            ]
 								            log_agent_payload(
 								                logger,
 								                "InterviewAgent.opening.prompt",
 								                format_history_string(
 								                    messages,
 								                    omit_system_body=settings.agent_log_omit_system_message_body,
 								                ),
 								            )

 								            opening_llm = self.llm.bind(
 								                max_tokens=settings.chat_opening_max_tokens,
 								                temperature=float(settings.chat_interview_temperature),
 								            )
 								            prompt_chars = _message_contents_char_count(messages)
 								            llm_t0 = time.perf_counter()
 								            with agent_span(
 								                logger,
 								                "InterviewAgent.opening.llm",
 								                conversation_id=conversation_id,
 								            ):
 								                logger.info(
 								                    "event=chat_prompt_built agent=InterviewAgent.generate_opening_message "
 								                    "prompt_chars={} history_pairs_total={} history_pairs_windowed={}",
 								                    prompt_chars,
 								                    hw.turn_total,
 								                    len(hw.window) // 2,
 								                )
 								                response = await opening_llm.ainvoke(messages)
 								            elapsed_ms = (time.perf_counter() - llm_t0) * 1000
 								            logger.info(
 								                "event=chat_llm_done agent=InterviewAgent.generate_opening_message "
 								                "response_latency_ms={:.2f}",
 								                elapsed_ms,
 								            )

 								            if hasattr(response, "content"):
 								                response_text = response.content
 								            else:
 								                response_text = str(response)
 								            log_agent_payload(
 								                logger, "InterviewAgent.opening.raw_response", response_text
 								            )

 								            # Split into at most two segments; when the splitter yields
 								            # nothing, fall back to the stripped raw text.
 								            raw_segments = segments_from_llm_response(
 								                response_text, max_segments=2
 								            ) or [response_text.strip()]
 								            max_chars = int(settings.chat_interview_max_chars_per_segment)
 								            trimmed = truncate_chat_segments(
 								                raw_segments,
 								                max_segments=2,
 								                max_chars_per_segment=max_chars,
 								            )
 								            log_agent_summary(
 								                logger,
 								                "InterviewAgent.opening segments={} conversation_id={}",
 								                len(trimmed),
 								                conversation_id,
 								            )
 								            segments = trimmed or [response_text.strip()[:max_chars]]
 								            return nonempty_segments_or_fallback(
 								                segments,
 								                fallback=fallback_opening,
 								            )
 								        except Exception as e:
 								            # Any failure degrades to the fixed greeting; details go to
 								            # the log only.
 								            logger.error("生成开场白失败: {}", e, exc_info=True)
 								            return [fallback_opening]