Files
life-echo/api/tests/test_json_and_memory_utils.py
Kevin 309a051038 feat: 回忆录证据血缘与内部评测可追溯,顺带对齐本地评测台与 CI
数据库与模型:新增多版迁移(章节证据快照、对话血缘、记忆事实/时间线 lineage 等),把「成稿 ↔ 对话/记忆」的溯源信息落到表结构里。
业务链路:会话与 WS、回忆录/故事流水线、记忆写入与 enrichment 等跟着接上线索与快照;新增章节证据快照与评测侧 EvalTraceService 等模块,方便组评审用的证据包。
内部评测:自动化 run 与手工 memoir 评审共用可追溯证据;rubric/ judge 相关脚本与文档有配套调整。
app-eval-web:Memoir/实验详情里能展开看证据摘要与 evidence_trace(含对话轮次 id);Vite 代理与 development.sh 注入的 API 端口与当前默认内部评测端口一致,避免改端口后页面连错服务。
工程杂项:GitHub Actions / 仓库说明有更新;各适配器与支付/配额/plan 等多处为小改动或跟随主改动的收尾;新增/扩充了?
2026-04-08 15:37:09 +08:00

113 lines
3.3 KiB
Python

"""JSON 载荷解析、证据格式化、Story 批量规划校验(纯函数)。"""
import pytest
from app.agents.chat.reply_limits import truncate_chat_segments
from app.agents.memoir.classification_agent import _normalize_llm_category
from app.agents.memoir.prompts import format_evidence_chunks_for_prompt
from app.features.memory.evidence_format import (
format_evidence_chunks_for_prompt as format_evidence_from_memory,
)
from app.agents.memoir.story_route_agent import (
StoryBatchPlan,
StoryBatchPlanUnit,
validate_story_batch_plan,
)
from app.core.json_utils import extract_json_payload
def test_extract_json_payload_strips_markdown_fence() -> None:
raw = """```json
{"a": 1}
```"""
assert '"a"' in extract_json_payload(raw)
def test_extract_json_payload_balanced_nested_braces() -> None:
raw = 'noise {"outer": {"inner": 1}} trailing'
assert extract_json_payload(raw) == '{"outer": {"inner": 1}}'
def test_normalize_llm_category_strips_quotes() -> None:
assert _normalize_llm_category('"childhood"') == "childhood"
assert _normalize_llm_category("`beliefs`") == "beliefs"
def test_format_evidence_chunks_includes_timeline() -> None:
ev = {
"relevant_chunks": [{"content": "chunk1"}],
"relevant_facts": [
{"subject": "", "predicate": "生于", "object_json": "1950"}
],
"timeline_hints": [
{
"id": "1",
"event_year": 1977,
"event_date": None,
"title": "恢复高考",
"description": "参加了考试",
}
],
"relevant_summaries": [],
"relevant_stories": [],
}
out = format_evidence_chunks_for_prompt(ev)
assert "chunk1" in out
assert "1950" in out or "生于" in out
assert "1977" in out or "恢复高考" in out
assert format_evidence_from_memory(ev) == out
def test_validate_story_batch_plan_ok() -> None:
ordered = ["s1", "s2"]
plan = StoryBatchPlan(
units=[
StoryBatchPlanUnit(
segment_ids=["s1", "s2"],
decision="new_story",
target_story_id=None,
new_story_title="标题",
reason=None,
)
]
)
ok, err = validate_story_batch_plan(ordered, plan, valid_story_ids=set())
assert ok is True
assert err is None
def test_truncate_chat_segments() -> None:
out = truncate_chat_segments(
["a" * 300, "b"],
max_segments=2,
max_chars_per_segment=220,
)
assert out[0] == "a" * 219 + ""
assert len(out[0]) == 220
assert out[1] == "b"
def test_validate_story_batch_plan_duplicate_segment() -> None:
plan = StoryBatchPlan(
units=[
StoryBatchPlanUnit(
segment_ids=["s1"],
decision="new_story",
target_story_id=None,
new_story_title="A",
reason=None,
),
StoryBatchPlanUnit(
segment_ids=["s1"],
decision="new_story",
target_story_id=None,
new_story_title="B",
reason=None,
),
]
)
ok, err = validate_story_batch_plan(["s1", "s1"], plan, valid_story_ids=set())
assert ok is False
assert err == "duplicate_segment"