Files
life-echo/api/tests/test_classification_fragment.py
Kevin e4bf0710c7 feat(memory,conversation): 记忆富化/证据包、时间线幂等字段与对话分段全链路
数据库
- 新增迁移 0003:timeline_events.memory_source_id 外键 → memory_sources,便于按 ingest 源做时间线幂等

后端 - 记忆
- 新增 ingest 后 LLM 富化(摘要/事实/时间线),可配置开关与最大字符数
- 新增证据包组装:合并 chunk、摘要、事实、时间线、故事等检索结果;支持空 query 时是否仍带 rolling 等开关
- repo/retriever/service/router/schemas/summarizer/timeline/extractor 等扩展;文档 memory-retrieval.md 更新

后端 - 对话 WS
- 增加 PING/PONG;分段 ASR 日志与空音频处理;转写失败与「无助手回复」错误提示更明确
- 助手多段回复持久化使用统一分隔符,与分段逻辑一致

后端 - Agent
- reply_limits:按 [SPLIT] 与段落拆段,并保证非空 fallback,供 WS 与 TTS 多段下发

后端 - 回忆录任务
- transcript ingest 记录 source_id;任务成功结?
2026-03-27 16:24:43 +08:00

59 lines
1.8 KiB
Python
Raw Blame History

This file contains ambiguous Unicode characters
This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.
"""ClassificationAgent零散档案启发式与 none→summary 兜底(纯函数/无 LLM"""
import pytest
from app.agents.memoir.classification_agent import (
ClassificationAgent,
_looks_like_fragment_only,
_parse_category_from_llm_response,
)
@pytest.mark.parametrize(
"text,expected_fragment",
[
("", True),
(" ", True),
("我1999年出生", True),
("1999年出生。", True),
("1999年出生", True),
("我是云南人", True),
("我是北京籍。", True),
("小学二年级那次下雨爷爷背我过河,鞋全湿了。", False),
("我出生在农村,家里养过一头黄牛。", False),
("我是北京人,后来去上海读了大学。", False),
],
)
def test_looks_like_fragment_only(text: str, expected_fragment: bool) -> None:
assert _looks_like_fragment_only(text) is expected_fragment
def test_classify_maps_birth_year_fragment_to_summary_without_llm() -> None:
agent = ClassificationAgent()
assert (
agent.classify("1999年出生", fallback_stage="childhood", llm=None) == "summary"
)
@pytest.mark.parametrize(
"raw,expected",
[
('{"category": "childhood"}', "childhood"),
('```json\n{"category": "none"}\n```', "none"),
("childhood", "childhood"),
('"education"', "education"),
],
)
def test_parse_category_from_llm_response(raw: str, expected: str) -> None:
assert _parse_category_from_llm_response(raw) == expected
def test_classify_fallback_when_no_llm_and_narrative_snippet() -> None:
agent = ClassificationAgent()
out = agent.classify(
"小学二年级的时候我在操场上摔了一跤,膝盖流了很多血,是老师背我去医务室的。",
fallback_stage="childhood",
llm=None,
)
assert out == "education"