feat(evaluation): memoir readiness, judge/replay updates, eval web playground
Add memoir_readiness_service and router tests; extend judge schemas/services, replay_service, and conversation rubric; align story route agent, payload, prompts, and story_pipeline_sync; update agent logging, config, and DI. Document internal-eval; add replayDraft util and PlaygroundPage changes in app-eval-web.
This commit is contained in:
94
api/tests/evaluation/test_memoir_readiness_router.py
Normal file
94
api/tests/evaluation/test_memoir_readiness_router.py
Normal file
@@ -0,0 +1,94 @@
|
||||
"""memoir-phase1-ready internal 路由(依赖注入替身)。"""
|
||||
|
||||
import pytest
|
||||
from httpx import ASGITransport, AsyncClient
|
||||
|
||||
from app.features.evaluation.internal_auth import get_internal_eval_principal
|
||||
from app.features.evaluation.schemas import MemoirPhase1ReadyOut
|
||||
|
||||
|
||||
@pytest.mark.asyncio
|
||||
async def test_memoir_phase1_ready_returns_bundle(monkeypatch: pytest.MonkeyPatch) -> None:
|
||||
from fastapi import FastAPI
|
||||
|
||||
monkeypatch.setattr(
|
||||
"app.core.config.settings.internal_eval_api_key",
|
||||
"secret",
|
||||
raising=False,
|
||||
)
|
||||
from app.features.evaluation.deps import get_memoir_readiness_service
|
||||
from app.features.evaluation.router import router
|
||||
|
||||
class _Fake:
|
||||
async def memoir_phase1_ready_for_segments(
|
||||
self, *, conversation_id: str, segment_ids: list[str]
|
||||
) -> MemoirPhase1ReadyOut:
|
||||
return MemoirPhase1ReadyOut(
|
||||
ready=True,
|
||||
checked_segment_ids=list(segment_ids),
|
||||
pending_segment_ids=[],
|
||||
)
|
||||
|
||||
app = FastAPI()
|
||||
app.include_router(router, prefix="/internal/api/evaluation")
|
||||
|
||||
async def _override_auth():
|
||||
from app.features.evaluation.internal_auth import InternalEvalPrincipal
|
||||
|
||||
return InternalEvalPrincipal()
|
||||
|
||||
app.dependency_overrides[get_internal_eval_principal] = _override_auth
|
||||
app.dependency_overrides[get_memoir_readiness_service] = lambda: _Fake()
|
||||
|
||||
transport = ASGITransport(app=app)
|
||||
async with AsyncClient(transport=transport, base_url="http://t") as client:
|
||||
r = await client.get(
|
||||
"/internal/api/evaluation/sessions/cid-a/memoir-phase1-ready",
|
||||
headers={"X-Internal-Eval-Key": "secret"},
|
||||
params=[("segment_ids", "s1"), ("segment_ids", "s2")],
|
||||
)
|
||||
assert r.status_code == 200
|
||||
body = r.json()
|
||||
assert body["ready"] is True
|
||||
assert body["checked_segment_ids"] == ["s1", "s2"]
|
||||
assert body["pending_segment_ids"] == []
|
||||
|
||||
|
||||
@pytest.mark.asyncio
|
||||
async def test_memoir_phase1_ready_404_propagates(monkeypatch: pytest.MonkeyPatch) -> None:
|
||||
from fastapi import FastAPI
|
||||
|
||||
monkeypatch.setattr(
|
||||
"app.core.config.settings.internal_eval_api_key",
|
||||
"secret",
|
||||
raising=False,
|
||||
)
|
||||
from app.features.evaluation.deps import get_memoir_readiness_service
|
||||
from app.features.evaluation.errors import EvaluationNotFoundError
|
||||
from app.features.evaluation.router import router
|
||||
|
||||
class _Fake:
|
||||
async def memoir_phase1_ready_for_segments(
|
||||
self, *, conversation_id: str, segment_ids: list[str]
|
||||
) -> MemoirPhase1ReadyOut:
|
||||
raise EvaluationNotFoundError("conversation not found")
|
||||
|
||||
app = FastAPI()
|
||||
app.include_router(router, prefix="/internal/api/evaluation")
|
||||
|
||||
async def _override_auth():
|
||||
from app.features.evaluation.internal_auth import InternalEvalPrincipal
|
||||
|
||||
return InternalEvalPrincipal()
|
||||
|
||||
app.dependency_overrides[get_internal_eval_principal] = _override_auth
|
||||
app.dependency_overrides[get_memoir_readiness_service] = lambda: _Fake()
|
||||
|
||||
transport = ASGITransport(app=app)
|
||||
async with AsyncClient(transport=transport, base_url="http://t") as client:
|
||||
r = await client.get(
|
||||
"/internal/api/evaluation/sessions/missing/memoir-phase1-ready",
|
||||
headers={"X-Internal-Eval-Key": "secret"},
|
||||
params=[("segment_ids", "s1")],
|
||||
)
|
||||
assert r.status_code == 404
|
||||
Reference in New Issue
Block a user