# api/app/features/memoir/asset_resolver.py

"""
asset:// 与正文占位符清理。

从正文移除 {{IMAGE:...}} / {{{{IMAGE:...}}}}（历史正文可能仍含此类标记）。
"""

import re
from typing import Callable

# Matches legacy image placeholders in either spelling: the quadruple-brace
# form ``{{{{IMAGE:...}}}}`` (tried first) or the double-brace form
# ``{{IMAGE:...}}``. The payload is captured lazily, and DOTALL lets it span
# line breaks.
_PLACEHOLDER_RE = re.compile(
    r"\{\{\{\{IMAGE:(.*?)\}\}\}\}|\{\{IMAGE:(.*?)\}\}",
    re.DOTALL,
)

# Matches a markdown image whose target is ``asset://<id>``.
# Group 1 is the alt text (may be empty); group 2 is the id, restricted to
# ASCII letters, digits, ``_`` and ``-``.
_ASSET_REF_RE = re.compile(r"!\[([^\]]*)\]\(asset://([a-zA-Z0-9_-]+)\)")
# Matches a run of three or more consecutive newlines.
_BLANK_RUN_RE = re.compile(r"\n{3,}")


def strip_image_placeholders(text: str | None) -> str:
    """移除正文中的 IMAGE 占位符，保留其余 markdown。"""
    if not text:
        return ""
    return _PLACEHOLDER_RE.sub("", text).strip()


def parse_asset_refs(markdown: str) -> list[tuple[int, int, str, str]]:
    """Locate every match of ``_ASSET_REF_RE`` in *markdown*.

    Returns one ``(start, end, caption, asset_id)`` tuple per match, in the
    order the matches occur; ``start`` and ``end`` are the match offsets into
    *markdown*. A falsy *markdown* is treated as the empty string and yields
    an empty list.
    """
    source = markdown or ""
    return [
        (hit.start(), hit.end(), hit.group(1) or "", hit.group(2) or "")
        for hit in _ASSET_REF_RE.finditer(source)
    ]


def collect_asset_ids_from_markdown(markdown: str) -> list[str]:
    """List the asset ids captured by ``_ASSET_REF_RE`` in *markdown*.

    Ids come back in order of appearance and duplicates are kept. A falsy
    *markdown* is treated as the empty string and yields an empty list.
    """
    found: list[str] = []
    for hit in _ASSET_REF_RE.finditer(markdown or ""):
        asset_id = hit.group(2)
        if asset_id:
            found.append(asset_id)
    return found


def strip_asset_image_refs_from_markdown(markdown: str | None) -> str:
    """Remove all `![...](asset://...)` references; collapse blank lines.

    Used for story single-primary policy: new versions / backfill must not
    accumulate multiple inline asset images.
    """
    if not markdown or not str(markdown).strip():
        return ""
    text = _ASSET_REF_RE.sub("", markdown or "")
    text = _BLANK_RUN_RE.sub("\n\n", text)
    return text.strip()


def collect_asset_ids_for_chapter(chapter) -> set[str]:
    """Gather every asset id that *chapter* refers to.

    All attributes are read with ``getattr(..., None)``, so a missing or
    falsy attribute simply contributes nothing. Ids are taken from:

    * the asset references in the chapter's ``canonical_markdown``;
    * the chapter's ``cover_asset_id``;
    * for each entry of ``story_links`` whose ``story`` is not ``None``:
      the asset references in that story's ``canonical_markdown``, plus the
      ``asset_id`` of each of its ``image_intents`` whose ``intent_role``
      equals ``"primary"``.

    Ids read from attributes are converted with ``str`` before being added.
    """
    chapter_md = getattr(chapter, "canonical_markdown", None) or ""
    collected: set[str] = set(collect_asset_ids_from_markdown(chapter_md))

    cover_id = getattr(chapter, "cover_asset_id", None)
    if cover_id:
        collected.add(str(cover_id))

    for link in getattr(chapter, "story_links", None) or []:
        story = getattr(link, "story", None)
        if story is None:
            continue

        story_md = getattr(story, "canonical_markdown", None) or ""
        collected.update(collect_asset_ids_from_markdown(story_md))

        for intent in getattr(story, "image_intents", None) or []:
            is_primary = getattr(intent, "intent_role", None) == "primary"
            if not is_primary:
                continue
            primary_asset = getattr(intent, "asset_id", None)
            if primary_asset:
                collected.add(str(primary_asset))

    return collected


def collect_asset_ids_for_chapters(chapters: list) -> set[str]:
    """Return the union of the asset ids collected from each chapter.

    Each element of *chapters* is passed to ``collect_asset_ids_for_chapter``.
    A falsy *chapters* (``None`` or an empty list) gives an empty set.
    """
    per_chapter = [collect_asset_ids_for_chapter(item) for item in chapters or []]
    return set().union(*per_chapter)


def split_markdown_by_asset_refs(
    markdown: str,
    resolve_asset: Callable[[str], str | None],
) -> list[dict]:
    """Break *markdown* into an ordered list of text and image blocks.

    The text is cut at every reference reported by ``parse_asset_refs``:

    * text between references becomes ``{"type": "text", "value": ...}``
      after trimming; pieces that are empty once trimmed are skipped;
    * a reference becomes ``{"type": "image", "url": ..., "caption": ...}``
      where ``url`` is what ``resolve_asset(asset_id)`` returned. When the
      resolver returns a falsy value no image block is emitted.

    A falsy *markdown* is treated as the empty string.
    """
    source = markdown or ""
    segments: list[dict] = []

    def push_text(raw: str) -> None:
        # Only keep text that still has content after trimming.
        trimmed = raw.strip()
        if trimmed:
            segments.append({"type": "text", "value": trimmed})

    cursor = 0  # offset just past the last reference consumed
    for ref_start, ref_end, caption, asset_id in parse_asset_refs(source):
        if ref_start > cursor:
            push_text(source[cursor:ref_start])
        resolved = resolve_asset(asset_id) if asset_id else None
        if resolved:
            segments.append({"type": "image", "url": resolved, "caption": caption})
        cursor = ref_end

    # Trailing text after the final reference (or the whole input when
    # there were no references at all).
    if cursor < len(source):
        push_text(source[cursor:])

    return segments


def resolve_asset_refs_in_markdown(
    markdown: str,
    resolve_asset: Callable[[str], str | None],
) -> str:
    if not markdown or not resolve_asset:
        return markdown or ""

    def repl(m):
        caption, asset_id = m.group(1) or "", m.group(2) or ""
        url = resolve_asset(asset_id) if asset_id else None
        if url:
            return f"![{caption}]({url})"
        return m.group(0)

    return _ASSET_REF_RE.sub(repl, markdown)
-												重构回忆录为 story-first / markdown-first 架构并整合图片意图与前端 UI 修复

本次 squash merge 将 codex-story-first-image-intent 的整体改动合入 development，核心内容包括：

1. 后端数据与迁移：新增 stories、story_versions、story_image_intents、chapter_cover_intents、assets 等模型与 Alembic 迁移，建立 story-first、markdown-first、asset-first 的主数据链路。

2. 生成与任务链：引入 StoryBuilderOrchestrator、ChapterComposerOrchestrator、story_image_tasks、chapter_cover_tasks，图片生成从正文占位符改为结构化 intent -> asset -> markdown 回填。

3. 并发与一致性：为 story/chapter intent 增加 claim_token、claimed_at、attempt_count，采用数据库原子 claim 为主、Redis 锁为辅，避免重复生成、锁误删和 processing 卡死。

4. Memoir 读写路径：章节 canonical_markdown 成为正文真源，列表/详情接口补齐 markdown、cover_asset、word_count 等字段，PDF 与 asset 解析链路同步升级。

5. Memory / Retrieval：扩展 transcript ingest、chunking、evidence 检索与 story 聚合基础设施，为后续 story-first RAG 与多 agent 编排提供底座。

6. App 端体验：章节页继续走 MarkdownRenderer 阅读链，同时吸收 fix3-19 的跨平台 UI glitch 修复；更新对话页、首页、文案资源与章节列表映射逻辑。

7. 测试与文档：补充 asset resolver、story image task、章节封面派发、markdown 映射等回归测试，并加入图片占位符退役设计文档。

											
										
										
											2026-03-20 10:30:07 +08:00
+								"""
-												refactor(api,expo): 多智能体与会话收敛、回忆录兼容层移除、后端测试集大幅删减

- 对齐「多智能体收敛」与「回忆录 stories-first / markdown-first」方向：收紧运行时契约、
  删除过渡兼容路径与双轨逻辑，并同步更新客户端与文档。

- Chat：以 ChatOrchestrator 为实时编排入口；删除独立 conversation_agent，精简 prompts。
- Memoir：删除 memory_agent；MemoirOrchestrator、classification / story_route 与 prompts 收敛到
  prepare_batches + run_story_pipeline_for_category_batch 主链路。
- 将 agents 侧 processor 迁入 feature 层为 background_runner，并移除 features 下重复/过时
  processor 封装。

- 新增 history_store，强化「conversation_messages 为 DB 真源、Redis 为缓存」模型。
- 调整 models、repo、service、session_history；精简 WS message_types，重构 pipeline 与 router。

- 移除章节占位、整章再生等旧路径；章节列表与封面逻辑要求 story 关联；收紧 cover 资格与
  enqueue。
- helpers、repo、service、router、reading_segment_materialize、story_pipeline_sync、pdf_service
  等按 canonical markdown / cover_asset_id 收缩；删除 memoir_images/provider 等冗余。
- tasks：memoir_tasks、chapter_cover_tasks 等大幅瘦身；story_image_tasks 等与当前图片任务对齐。

- core：config、logging、redis、task_tracker 小幅调整。
- auth / user / payment / quota：路由或服务侧删减过时接口或逻辑（如 payment router 行数减少）。

- pyproject.toml、development.sh、.env.example / .env.production、README 等同步说明或变量。

- Alembic 0001_initial_schema 微调（与当前 schema 叙事一致的小改动）。

- 回忆录：types / mappers / api、章节页与 memoir 页与后端契约对齐；markdown-renderer 调整。
- 语音：删除 voice/player，voice-segment-store 相应精简。

- api/tests：删除 conftest 及绝大部分既有测试文件（websocket_baseline、conversation、memoir
  图片、PDF、SMS 等），属有意收缩/待按 backend-test-system 重建的信号。
- docs：新增多智能体收敛与移除兼容层计划摘要；更新 story-first 设计、backend-test-system、
  multi-agent-refactor-plan、实施总结等。

BREAKING CHANGE: 后端对外契约、回忆录章节字段与若干路由/任务行为已变更；大量 API 测试被移除，
  CI 若依赖这些用例需按新策略补测或调整流水线。

											
										
										
											2026-03-22 16:45:57 +08:00
+								asset:// 与正文占位符清理。
-												重构回忆录为 story-first / markdown-first 架构并整合图片意图与前端 UI 修复

本次 squash merge 将 codex-story-first-image-intent 的整体改动合入 development，核心内容包括：

1. 后端数据与迁移：新增 stories、story_versions、story_image_intents、chapter_cover_intents、assets 等模型与 Alembic 迁移，建立 story-first、markdown-first、asset-first 的主数据链路。

2. 生成与任务链：引入 StoryBuilderOrchestrator、ChapterComposerOrchestrator、story_image_tasks、chapter_cover_tasks，图片生成从正文占位符改为结构化 intent -> asset -> markdown 回填。

3. 并发与一致性：为 story/chapter intent 增加 claim_token、claimed_at、attempt_count，采用数据库原子 claim 为主、Redis 锁为辅，避免重复生成、锁误删和 processing 卡死。

4. Memoir 读写路径：章节 canonical_markdown 成为正文真源，列表/详情接口补齐 markdown、cover_asset、word_count 等字段，PDF 与 asset 解析链路同步升级。

5. Memory / Retrieval：扩展 transcript ingest、chunking、evidence 检索与 story 聚合基础设施，为后续 story-first RAG 与多 agent 编排提供底座。

6. App 端体验：章节页继续走 MarkdownRenderer 阅读链，同时吸收 fix3-19 的跨平台 UI glitch 修复；更新对话页、首页、文案资源与章节列表映射逻辑。

7. 测试与文档：补充 asset resolver、story image task、章节封面派发、markdown 映射等回归测试，并加入图片占位符退役设计文档。

											
										
										
											2026-03-20 10:30:07 +08:00
-												refactor(api,expo): 多智能体与会话收敛、回忆录兼容层移除、后端测试集大幅删减

- 对齐「多智能体收敛」与「回忆录 stories-first / markdown-first」方向：收紧运行时契约、
  删除过渡兼容路径与双轨逻辑，并同步更新客户端与文档。

- Chat：以 ChatOrchestrator 为实时编排入口；删除独立 conversation_agent，精简 prompts。
- Memoir：删除 memory_agent；MemoirOrchestrator、classification / story_route 与 prompts 收敛到
  prepare_batches + run_story_pipeline_for_category_batch 主链路。
- 将 agents 侧 processor 迁入 feature 层为 background_runner，并移除 features 下重复/过时
  processor 封装。

- 新增 history_store，强化「conversation_messages 为 DB 真源、Redis 为缓存」模型。
- 调整 models、repo、service、session_history；精简 WS message_types，重构 pipeline 与 router。

- 移除章节占位、整章再生等旧路径；章节列表与封面逻辑要求 story 关联；收紧 cover 资格与
  enqueue。
- helpers、repo、service、router、reading_segment_materialize、story_pipeline_sync、pdf_service
  等按 canonical markdown / cover_asset_id 收缩；删除 memoir_images/provider 等冗余。
- tasks：memoir_tasks、chapter_cover_tasks 等大幅瘦身；story_image_tasks 等与当前图片任务对齐。

- core：config、logging、redis、task_tracker 小幅调整。
- auth / user / payment / quota：路由或服务侧删减过时接口或逻辑（如 payment router 行数减少）。

- pyproject.toml、development.sh、.env.example / .env.production、README 等同步说明或变量。

- Alembic 0001_initial_schema 微调（与当前 schema 叙事一致的小改动）。

- 回忆录：types / mappers / api、章节页与 memoir 页与后端契约对齐；markdown-renderer 调整。
- 语音：删除 voice/player，voice-segment-store 相应精简。

- api/tests：删除 conftest 及绝大部分既有测试文件（websocket_baseline、conversation、memoir
  图片、PDF、SMS 等），属有意收缩/待按 backend-test-system 重建的信号。
- docs：新增多智能体收敛与移除兼容层计划摘要；更新 story-first 设计、backend-test-system、
  multi-agent-refactor-plan、实施总结等。

BREAKING CHANGE: 后端对外契约、回忆录章节字段与若干路由/任务行为已变更；大量 API 测试被移除，
  CI 若依赖这些用例需按新策略补测或调整流水线。

											
										
										
											2026-03-22 16:45:57 +08:00
+								从正文移除 {{IMAGE:...}} / {{{{IMAGE:...}}}}（历史正文可能仍含此类标记）。
-												重构回忆录为 story-first / markdown-first 架构并整合图片意图与前端 UI 修复

本次 squash merge 将 codex-story-first-image-intent 的整体改动合入 development，核心内容包括：

1. 后端数据与迁移：新增 stories、story_versions、story_image_intents、chapter_cover_intents、assets 等模型与 Alembic 迁移，建立 story-first、markdown-first、asset-first 的主数据链路。

2. 生成与任务链：引入 StoryBuilderOrchestrator、ChapterComposerOrchestrator、story_image_tasks、chapter_cover_tasks，图片生成从正文占位符改为结构化 intent -> asset -> markdown 回填。

3. 并发与一致性：为 story/chapter intent 增加 claim_token、claimed_at、attempt_count，采用数据库原子 claim 为主、Redis 锁为辅，避免重复生成、锁误删和 processing 卡死。

4. Memoir 读写路径：章节 canonical_markdown 成为正文真源，列表/详情接口补齐 markdown、cover_asset、word_count 等字段，PDF 与 asset 解析链路同步升级。

5. Memory / Retrieval：扩展 transcript ingest、chunking、evidence 检索与 story 聚合基础设施，为后续 story-first RAG 与多 agent 编排提供底座。

6. App 端体验：章节页继续走 MarkdownRenderer 阅读链，同时吸收 fix3-19 的跨平台 UI glitch 修复；更新对话页、首页、文案资源与章节列表映射逻辑。

7. 测试与文档：补充 asset resolver、story image task、章节封面派发、markdown 映射等回归测试，并加入图片占位符退役设计文档。

											
										
										
											2026-03-20 10:30:07 +08:00
+								"""
 								import re
 								from typing import Callable
 								_PLACEHOLDER_RE = re.compile(
 								    r"\{\{\{\{IMAGE:(.*?)\}\}\}\}|\{\{IMAGE:(.*?)\}\}",
 								    re.DOTALL,
 								)
 								_ASSET_REF_RE = re.compile(r"!\[([^\]]*)\]\(asset://([a-zA-Z0-9_-]+)\)")
-												修复一些已知问题

											
										
										
											2026-03-20 17:25:42 +08:00
+								_BLANK_RUN_RE = re.compile(r"\n{3,}")
-												重构回忆录为 story-first / markdown-first 架构并整合图片意图与前端 UI 修复

本次 squash merge 将 codex-story-first-image-intent 的整体改动合入 development，核心内容包括：

1. 后端数据与迁移：新增 stories、story_versions、story_image_intents、chapter_cover_intents、assets 等模型与 Alembic 迁移，建立 story-first、markdown-first、asset-first 的主数据链路。

2. 生成与任务链：引入 StoryBuilderOrchestrator、ChapterComposerOrchestrator、story_image_tasks、chapter_cover_tasks，图片生成从正文占位符改为结构化 intent -> asset -> markdown 回填。

3. 并发与一致性：为 story/chapter intent 增加 claim_token、claimed_at、attempt_count，采用数据库原子 claim 为主、Redis 锁为辅，避免重复生成、锁误删和 processing 卡死。

4. Memoir 读写路径：章节 canonical_markdown 成为正文真源，列表/详情接口补齐 markdown、cover_asset、word_count 等字段，PDF 与 asset 解析链路同步升级。

5. Memory / Retrieval：扩展 transcript ingest、chunking、evidence 检索与 story 聚合基础设施，为后续 story-first RAG 与多 agent 编排提供底座。

6. App 端体验：章节页继续走 MarkdownRenderer 阅读链，同时吸收 fix3-19 的跨平台 UI glitch 修复；更新对话页、首页、文案资源与章节列表映射逻辑。

7. 测试与文档：补充 asset resolver、story image task、章节封面派发、markdown 映射等回归测试，并加入图片占位符退役设计文档。

											
										
										
											2026-03-20 10:30:07 +08:00
-												refactor(api,expo): 多智能体与会话收敛、回忆录兼容层移除、后端测试集大幅删减

- 对齐「多智能体收敛」与「回忆录 stories-first / markdown-first」方向：收紧运行时契约、
  删除过渡兼容路径与双轨逻辑，并同步更新客户端与文档。

- Chat：以 ChatOrchestrator 为实时编排入口；删除独立 conversation_agent，精简 prompts。
- Memoir：删除 memory_agent；MemoirOrchestrator、classification / story_route 与 prompts 收敛到
  prepare_batches + run_story_pipeline_for_category_batch 主链路。
- 将 agents 侧 processor 迁入 feature 层为 background_runner，并移除 features 下重复/过时
  processor 封装。

- 新增 history_store，强化「conversation_messages 为 DB 真源、Redis 为缓存」模型。
- 调整 models、repo、service、session_history；精简 WS message_types，重构 pipeline 与 router。

- 移除章节占位、整章再生等旧路径；章节列表与封面逻辑要求 story 关联；收紧 cover 资格与
  enqueue。
- helpers、repo、service、router、reading_segment_materialize、story_pipeline_sync、pdf_service
  等按 canonical markdown / cover_asset_id 收缩；删除 memoir_images/provider 等冗余。
- tasks：memoir_tasks、chapter_cover_tasks 等大幅瘦身；story_image_tasks 等与当前图片任务对齐。

- core：config、logging、redis、task_tracker 小幅调整。
- auth / user / payment / quota：路由或服务侧删减过时接口或逻辑（如 payment router 行数减少）。

- pyproject.toml、development.sh、.env.example / .env.production、README 等同步说明或变量。

- Alembic 0001_initial_schema 微调（与当前 schema 叙事一致的小改动）。

- 回忆录：types / mappers / api、章节页与 memoir 页与后端契约对齐；markdown-renderer 调整。
- 语音：删除 voice/player，voice-segment-store 相应精简。

- api/tests：删除 conftest 及绝大部分既有测试文件（websocket_baseline、conversation、memoir
  图片、PDF、SMS 等），属有意收缩/待按 backend-test-system 重建的信号。
- docs：新增多智能体收敛与移除兼容层计划摘要；更新 story-first 设计、backend-test-system、
  multi-agent-refactor-plan、实施总结等。

BREAKING CHANGE: 后端对外契约、回忆录章节字段与若干路由/任务行为已变更；大量 API 测试被移除，
  CI 若依赖这些用例需按新策略补测或调整流水线。

											
										
										
											2026-03-22 16:45:57 +08:00
+								def strip_image_placeholders(text: str | None) -> str:
 								    """移除正文中的 IMAGE 占位符，保留其余 markdown。"""
-												重构回忆录为 story-first / markdown-first 架构并整合图片意图与前端 UI 修复

本次 squash merge 将 codex-story-first-image-intent 的整体改动合入 development，核心内容包括：

1. 后端数据与迁移：新增 stories、story_versions、story_image_intents、chapter_cover_intents、assets 等模型与 Alembic 迁移，建立 story-first、markdown-first、asset-first 的主数据链路。

2. 生成与任务链：引入 StoryBuilderOrchestrator、ChapterComposerOrchestrator、story_image_tasks、chapter_cover_tasks，图片生成从正文占位符改为结构化 intent -> asset -> markdown 回填。

3. 并发与一致性：为 story/chapter intent 增加 claim_token、claimed_at、attempt_count，采用数据库原子 claim 为主、Redis 锁为辅，避免重复生成、锁误删和 processing 卡死。

4. Memoir 读写路径：章节 canonical_markdown 成为正文真源，列表/详情接口补齐 markdown、cover_asset、word_count 等字段，PDF 与 asset 解析链路同步升级。

5. Memory / Retrieval：扩展 transcript ingest、chunking、evidence 检索与 story 聚合基础设施，为后续 story-first RAG 与多 agent 编排提供底座。

6. App 端体验：章节页继续走 MarkdownRenderer 阅读链，同时吸收 fix3-19 的跨平台 UI glitch 修复；更新对话页、首页、文案资源与章节列表映射逻辑。

7. 测试与文档：补充 asset resolver、story image task、章节封面派发、markdown 映射等回归测试，并加入图片占位符退役设计文档。

											
										
										
											2026-03-20 10:30:07 +08:00
+								    if not text:
 								        return ""
 								    return _PLACEHOLDER_RE.sub("", text).strip()
 								def parse_asset_refs(markdown: str) -> list[tuple[int, int, str, str]]:
 								    refs = []
 								    for m in _ASSET_REF_RE.finditer(markdown or ""):
 								        refs.append((m.start(), m.end(), m.group(1) or "", m.group(2) or ""))
 								    return refs
 								def collect_asset_ids_from_markdown(markdown: str) -> list[str]:
 								    return [m.group(2) for m in _ASSET_REF_RE.finditer(markdown or "") if m.group(2)]
-												修复一些已知问题

											
										
										
											2026-03-20 17:25:42 +08:00
+								def strip_asset_image_refs_from_markdown(markdown: str | None) -> str:
 								    """Remove all `![...](asset://...)` references; collapse blank lines.
 								    Used for story single-primary policy: new versions / backfill must not
 								    accumulate multiple inline asset images.
 								    """
 								    if not markdown or not str(markdown).strip():
 								        return ""
 								    text = _ASSET_REF_RE.sub("", markdown or "")
 								    text = _BLANK_RUN_RE.sub("\n\n", text)
 								    return text.strip()
-												重构回忆录为 story-first / markdown-first 架构并整合图片意图与前端 UI 修复

本次 squash merge 将 codex-story-first-image-intent 的整体改动合入 development，核心内容包括：

1. 后端数据与迁移：新增 stories、story_versions、story_image_intents、chapter_cover_intents、assets 等模型与 Alembic 迁移，建立 story-first、markdown-first、asset-first 的主数据链路。

2. 生成与任务链：引入 StoryBuilderOrchestrator、ChapterComposerOrchestrator、story_image_tasks、chapter_cover_tasks，图片生成从正文占位符改为结构化 intent -> asset -> markdown 回填。

3. 并发与一致性：为 story/chapter intent 增加 claim_token、claimed_at、attempt_count，采用数据库原子 claim 为主、Redis 锁为辅，避免重复生成、锁误删和 processing 卡死。

4. Memoir 读写路径：章节 canonical_markdown 成为正文真源，列表/详情接口补齐 markdown、cover_asset、word_count 等字段，PDF 与 asset 解析链路同步升级。

5. Memory / Retrieval：扩展 transcript ingest、chunking、evidence 检索与 story 聚合基础设施，为后续 story-first RAG 与多 agent 编排提供底座。

6. App 端体验：章节页继续走 MarkdownRenderer 阅读链，同时吸收 fix3-19 的跨平台 UI glitch 修复；更新对话页、首页、文案资源与章节列表映射逻辑。

7. 测试与文档：补充 asset resolver、story image task、章节封面派发、markdown 映射等回归测试，并加入图片占位符退役设计文档。

											
										
										
											2026-03-20 10:30:07 +08:00
+								def collect_asset_ids_for_chapter(chapter) -> set[str]:
-												fix/various fixes

											
										
										
											2026-03-20 15:15:35 +08:00
+								    """章节正文 canonical、收录的各 story 正文、cover_asset_id 中的 asset id。"""
-												重构回忆录为 story-first / markdown-first 架构并整合图片意图与前端 UI 修复

本次 squash merge 将 codex-story-first-image-intent 的整体改动合入 development，核心内容包括：

1. 后端数据与迁移：新增 stories、story_versions、story_image_intents、chapter_cover_intents、assets 等模型与 Alembic 迁移，建立 story-first、markdown-first、asset-first 的主数据链路。

2. 生成与任务链：引入 StoryBuilderOrchestrator、ChapterComposerOrchestrator、story_image_tasks、chapter_cover_tasks，图片生成从正文占位符改为结构化 intent -> asset -> markdown 回填。

3. 并发与一致性：为 story/chapter intent 增加 claim_token、claimed_at、attempt_count，采用数据库原子 claim 为主、Redis 锁为辅，避免重复生成、锁误删和 processing 卡死。

4. Memoir 读写路径：章节 canonical_markdown 成为正文真源，列表/详情接口补齐 markdown、cover_asset、word_count 等字段，PDF 与 asset 解析链路同步升级。

5. Memory / Retrieval：扩展 transcript ingest、chunking、evidence 检索与 story 聚合基础设施，为后续 story-first RAG 与多 agent 编排提供底座。

6. App 端体验：章节页继续走 MarkdownRenderer 阅读链，同时吸收 fix3-19 的跨平台 UI glitch 修复；更新对话页、首页、文案资源与章节列表映射逻辑。

7. 测试与文档：补充 asset resolver、story image task、章节封面派发、markdown 映射等回归测试，并加入图片占位符退役设计文档。

											
										
										
											2026-03-20 10:30:07 +08:00
+								    ids: set[str] = set()
 								    md = getattr(chapter, "canonical_markdown", None) or ""
 								    ids.update(collect_asset_ids_from_markdown(md))
 								    cid = getattr(chapter, "cover_asset_id", None)
 								    if cid:
 								        ids.add(str(cid))
-												fix/various fixes

											
										
										
											2026-03-20 15:15:35 +08:00
+								    for link in getattr(chapter, "story_links", None) or []:
 								        st = getattr(link, "story", None)
 								        if st is None:
 								            continue
 								        smd = getattr(st, "canonical_markdown", None) or ""
 								        ids.update(collect_asset_ids_from_markdown(smd))
-												修复：CI 部署环境与 ref 错配、迁移碎片化、图片意图 source_span、章节物化脏版式、会话历史与本地语音不一致

新增：TTS 上传 COS 与分片、章节 reading_segments 物化与快照、markdown 清洗、会话消息 repository、语音 store 重构与相关测试

											
										
										
											2026-03-20 16:36:42 +08:00
+								        for intent in getattr(st, "image_intents", None) or []:
 								            if getattr(intent, "intent_role", None) == "primary":
 								                aid = getattr(intent, "asset_id", None)
 								                if aid:
 								                    ids.add(str(aid))
-												重构回忆录为 story-first / markdown-first 架构并整合图片意图与前端 UI 修复

本次 squash merge 将 codex-story-first-image-intent 的整体改动合入 development，核心内容包括：

1. 后端数据与迁移：新增 stories、story_versions、story_image_intents、chapter_cover_intents、assets 等模型与 Alembic 迁移，建立 story-first、markdown-first、asset-first 的主数据链路。

2. 生成与任务链：引入 StoryBuilderOrchestrator、ChapterComposerOrchestrator、story_image_tasks、chapter_cover_tasks，图片生成从正文占位符改为结构化 intent -> asset -> markdown 回填。

3. 并发与一致性：为 story/chapter intent 增加 claim_token、claimed_at、attempt_count，采用数据库原子 claim 为主、Redis 锁为辅，避免重复生成、锁误删和 processing 卡死。

4. Memoir 读写路径：章节 canonical_markdown 成为正文真源，列表/详情接口补齐 markdown、cover_asset、word_count 等字段，PDF 与 asset 解析链路同步升级。

5. Memory / Retrieval：扩展 transcript ingest、chunking、evidence 检索与 story 聚合基础设施，为后续 story-first RAG 与多 agent 编排提供底座。

6. App 端体验：章节页继续走 MarkdownRenderer 阅读链，同时吸收 fix3-19 的跨平台 UI glitch 修复；更新对话页、首页、文案资源与章节列表映射逻辑。

7. 测试与文档：补充 asset resolver、story image task、章节封面派发、markdown 映射等回归测试，并加入图片占位符退役设计文档。

											
										
										
											2026-03-20 10:30:07 +08:00
+								    return ids
 								def collect_asset_ids_for_chapters(chapters: list) -> set[str]:
 								    combined: set[str] = set()
 								    for ch in chapters or []:
 								        combined |= collect_asset_ids_for_chapter(ch)
 								    return combined
 								def split_markdown_by_asset_refs(
 								    markdown: str,
 								    resolve_asset: Callable[[str], str | None],
 								) -> list[dict]:
 								    blocks: list[dict] = []
 								    refs = parse_asset_refs(markdown or "")
 								    if not refs:
 								        text = (markdown or "").strip()
 								        if text:
 								            blocks.append({"type": "text", "value": text})
 								        return blocks
 								    pos = 0
 								    for start, end, caption, asset_id in refs:
 								        if start > pos:
 								            text = markdown[pos:start].strip()
 								            if text:
 								                blocks.append({"type": "text", "value": text})
 								        url = resolve_asset(asset_id) if asset_id else None
 								        if url:
 								            blocks.append({"type": "image", "url": url, "caption": caption})
 								        pos = end
 								    if pos < len(markdown or ""):
 								        text = markdown[pos:].strip()
 								        if text:
 								            blocks.append({"type": "text", "value": text})
 								    return blocks
 								def resolve_asset_refs_in_markdown(
 								    markdown: str,
 								    resolve_asset: Callable[[str], str | None],
 								) -> str:
 								    if not markdown or not resolve_asset:
 								        return markdown or ""
 								    def repl(m):
 								        caption, asset_id = m.group(1) or "", m.group(2) or ""
 								        url = resolve_asset(asset_id) if asset_id else None
 								        if url:
 								            return f"![{caption}]({url})"
 								        return m.group(0)
 								    return _ASSET_REF_RE.sub(repl, markdown)