Files
life-echo/api/tests/test_classification_fragment.py
2026-03-23 13:54:41 +08:00

43 lines
1.4 KiB
Python
Raw Blame History

This file contains ambiguous Unicode characters
This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.
"""ClassificationAgent零散档案启发式与分类 none 语义(纯函数/无 LLM"""
import pytest
from app.agents.memoir.classification_agent import (
ClassificationAgent,
_looks_like_fragment_only,
)
@pytest.mark.parametrize(
"text,expected_fragment",
[
("", True),
(" ", True),
("我1999年出生", True),
("1999年出生。", True),
("1999年出生", True),
("我是云南人", True),
("我是北京籍。", True),
("小学二年级那次下雨爷爷背我过河,鞋全湿了。", False),
("我出生在农村,家里养过一头黄牛。", False),
("我是北京人,后来去上海读了大学。", False),
],
)
def test_looks_like_fragment_only(text: str, expected_fragment: bool) -> None:
assert _looks_like_fragment_only(text) is expected_fragment
def test_classify_skips_story_for_birth_year_without_llm() -> None:
agent = ClassificationAgent()
assert agent.classify("1999年出生", fallback_stage="childhood", llm=None) is None
def test_classify_fallback_when_no_llm_and_narrative_snippet() -> None:
agent = ClassificationAgent()
out = agent.classify(
"小学二年级的时候我在操场上摔了一跤,膝盖流了很多血,是老师背我去医务室的。",
fallback_stage="childhood",
llm=None,
)
assert out == "education"