43 lines
1.4 KiB
Python
43 lines
1.4 KiB
Python
|
|
"""ClassificationAgent:零散档案启发式与分类 none 语义(纯函数/无 LLM)。"""
|
|||
|
|
|
|||
|
|
import pytest
|
|||
|
|
|
|||
|
|
from app.agents.memoir.classification_agent import (
|
|||
|
|
ClassificationAgent,
|
|||
|
|
_looks_like_fragment_only,
|
|||
|
|
)
|
|||
|
|
|
|||
|
|
|
|||
|
|
@pytest.mark.parametrize(
|
|||
|
|
"text,expected_fragment",
|
|||
|
|
[
|
|||
|
|
("", True),
|
|||
|
|
(" ", True),
|
|||
|
|
("我1999年出生", True),
|
|||
|
|
("1999年出生。", True),
|
|||
|
|
("1999年出生!", True),
|
|||
|
|
("我是云南人", True),
|
|||
|
|
("我是北京籍。", True),
|
|||
|
|
("小学二年级那次下雨爷爷背我过河,鞋全湿了。", False),
|
|||
|
|
("我出生在农村,家里养过一头黄牛。", False),
|
|||
|
|
("我是北京人,后来去上海读了大学。", False),
|
|||
|
|
],
|
|||
|
|
)
|
|||
|
|
def test_looks_like_fragment_only(text: str, expected_fragment: bool) -> None:
|
|||
|
|
assert _looks_like_fragment_only(text) is expected_fragment
|
|||
|
|
|
|||
|
|
|
|||
|
|
def test_classify_skips_story_for_birth_year_without_llm() -> None:
|
|||
|
|
agent = ClassificationAgent()
|
|||
|
|
assert agent.classify("1999年出生", fallback_stage="childhood", llm=None) is None
|
|||
|
|
|
|||
|
|
|
|||
|
|
def test_classify_fallback_when_no_llm_and_narrative_snippet() -> None:
|
|||
|
|
agent = ClassificationAgent()
|
|||
|
|
out = agent.classify(
|
|||
|
|
"小学二年级的时候我在操场上摔了一跤,膝盖流了很多血,是老师背我去医务室的。",
|
|||
|
|
fallback_stage="childhood",
|
|||
|
|
llm=None,
|
|||
|
|
)
|
|||
|
|
assert out == "education"
|