# File: life-echo/api/app/features/memoir/memoir_images/schema.py
# (Repository web-viewer header: 158 lines, 5.4 KiB, Python.)

import re
from typing import Any
# Status values an image asset may carry.
IMAGE_STATUS_PENDING = "pending"
IMAGE_STATUS_PROCESSING = "processing"
IMAGE_STATUS_COMPLETED = "completed"
IMAGE_STATUS_FAILED = "failed"

# The full set of statuses recognised by the normalizers in this module; any
# other status string is treated as invalid.
VALID_IMAGE_STATUSES = {
    IMAGE_STATUS_PENDING,
    IMAGE_STATUS_PROCESSING,
    IMAGE_STATUS_COMPLETED,
    IMAGE_STATUS_FAILED,
}
# Blame timestamp (web-viewer residue): 2026-03-19 14:36:14 +08:00
_PLACEHOLDER_DESCRIPTION_RE = re.compile(
r"\{\{\{\{IMAGE:(.*?)\}\}\}\}|\{\{IMAGE:(.*?)\}\}"
)
def normalize_image_asset(asset: dict[str, Any] | None) -> dict[str, Any] | None:
    """Normalize a single image-asset dict, or return ``None`` if it is unusable.

    The description is taken from the ``description`` field or, failing that,
    parsed out of a ``{{{{IMAGE:...}}}}`` / ``{{IMAGE:...}}`` placeholder.

    An asset that has both a placeholder and a description is always kept.
    Otherwise it is kept only when one of the following holds:

    - status is completed and a ``url`` or ``storage_key`` is present (an
      illustration that is not embedded in markdown needs no placeholder);
    - status is pending/processing (pending is assumed when the status is
      missing) and a description, placeholder or prompt is present;
    - status is failed and a description, placeholder or error is present.

    Args:
        asset: Raw asset mapping; anything that is not a dict is rejected.

    Returns:
        A shallow copy of ``asset`` with normalized fields, or ``None`` when
        the asset is rejected. In the copy:

        - ``index`` is coerced to int (0 when not coercible);
        - ``placeholder`` is ``""`` when absent;
        - ``description`` falls back to the prompt (pending/processing only)
          and finally to the literal ``"插图"``;
        - an unrecognised status is reported as failed with an
          ``invalid image status`` error, and the remaining fields are left
          exactly as they were in the input;
        - a completed asset without ``url``/``storage_key`` is demoted to
          failed with ``missing image url``;
        - ``retryable`` is cleared unless the final status is failed.
    """
    if not isinstance(asset, dict):
        return None

    placeholder = _as_non_empty_string(asset.get("placeholder"))
    description = _as_non_empty_string(asset.get("description"))
    if description is None and placeholder:
        description = _extract_description_from_placeholder(placeholder)

    prompt_hint = _as_non_empty_string(asset.get("prompt"))
    error_text = _as_optional_string(asset.get("error"))
    url = _as_optional_string(asset.get("url"))
    storage_key = _as_optional_string(asset.get("storage_key"))
    status = _as_non_empty_string(asset.get("status")) or IMAGE_STATUS_PENDING
    in_flight = status in (IMAGE_STATUS_PENDING, IMAGE_STATUS_PROCESSING)

    # Without a placeholder + description pair, the asset must justify itself
    # through whatever evidence its status calls for.
    if not (placeholder and description):
        if status == IMAGE_STATUS_COMPLETED:
            usable = bool(url or storage_key)
        elif in_flight:
            usable = bool(description or placeholder or prompt_hint)
        elif status == IMAGE_STATUS_FAILED:
            usable = bool(description or placeholder or error_text)
        else:
            usable = False
        if not usable:
            return None

    # Only assets still being generated may borrow the prompt as description.
    prompt_fallback = prompt_hint if in_flight else None

    result = dict(asset)
    result["index"] = _coerce_int(asset.get("index"), default=0)
    result["placeholder"] = placeholder or ""
    result["description"] = description or prompt_fallback or "插图"

    if status not in VALID_IMAGE_STATUSES:
        # Unknown status: report it as a failure and stop here; the other
        # fields keep their raw input values.
        result["status"] = IMAGE_STATUS_FAILED
        result["error"] = asset.get("error") or f"invalid image status: {status}"
        return result

    result["status"] = status
    string_fields = (
        "prompt",
        "url",
        "storage_key",
        "provider",
        "style",
        "size",
        "error",
        "created_at",
        "updated_at",
    )
    for field_name in string_fields:
        result[field_name] = _as_optional_string(asset.get(field_name))
    result["retryable"] = _as_optional_bool(asset.get("retryable"))

    # A "completed" asset that cannot be located is effectively a failure.
    has_location = bool(result["url"] or result["storage_key"])
    if status == IMAGE_STATUS_COMPLETED and not has_location:
        result["status"] = IMAGE_STATUS_FAILED
        result["error"] = result["error"] or "missing image url"

    # The retry flag is only meaningful for failed assets.
    if result["status"] != IMAGE_STATUS_FAILED:
        result["retryable"] = None
    return result
def normalize_image_assets(images: list[dict[str, Any]] | None) -> list[dict[str, Any]]:
    """Normalize every asset in ``images`` and drop the ones that are rejected.

    Args:
        images: Raw asset dicts; ``None`` (or an empty list) yields ``[]``.

    Returns:
        The normalized assets, in input order, excluding every entry for
        which ``normalize_image_asset`` returned a falsy result.
    """
    candidates = (normalize_image_asset(raw) for raw in images or [])
    return [asset for asset in candidates if asset]
def completed_image_assets(images: list[dict[str, Any]] | None) -> list[dict[str, Any]]:
    """Return the normalized assets that are completed and locatable.

    Args:
        images: Raw asset dicts, passed through ``normalize_image_assets``.

    Returns:
        Normalized assets whose status is completed and that carry a truthy
        ``storage_key`` or ``url``, in input order.
    """

    def _is_deliverable(asset: dict[str, Any]) -> bool:
        if asset.get("status") != IMAGE_STATUS_COMPLETED:
            return False
        return bool(asset.get("storage_key") or asset.get("url"))

    return [asset for asset in normalize_image_assets(images) if _is_deliverable(asset)]
def _as_non_empty_string(value: Any) -> str | None:
if isinstance(value, str):
stripped = value.strip()
return stripped or None
return None
def _as_optional_string(value: Any) -> str | None:
if value is None:
return None
if isinstance(value, str):
return value
return str(value)
def _as_optional_bool(value: Any) -> bool | None:
if value is None:
return None
if isinstance(value, bool):
return value
if isinstance(value, str):
lowered = value.strip().lower()
if lowered in {"true", "1", "yes"}:
return True
if lowered in {"false", "0", "no"}:
return False
return None
def _coerce_int(value: Any, default: int) -> int:
try:
return int(value)
except (TypeError, ValueError):
return default
def _extract_description_from_placeholder(placeholder: str | None) -> str | None:
    """Pull the description text out of an image placeholder.

    Args:
        placeholder: Placeholder text; surrounding whitespace is ignored.

    Returns:
        The stripped description captured by ``_PLACEHOLDER_DESCRIPTION_RE``,
        or ``None`` when ``placeholder`` is empty, does not match the pattern
        in its entirety, or carries a blank description.
    """
    if not placeholder:
        return None
    found = _PLACEHOLDER_DESCRIPTION_RE.fullmatch(placeholder.strip())
    if found is None:
        return None
    # Exactly one alternative matched, so at most one group holds text.
    captured = next((group for group in found.groups() if group), "")
    cleaned = captured.strip()
    return cleaned if cleaned else None