# api/app/agents/memoir/batch_phase1_prep.py

"""
Phase1 批处理：一次 LLM 调用完成多段的抽取 + 章节分类（与逐段循环语义对齐）。
"""

from __future__ import annotations

import math
from dataclasses import dataclass
from typing import Any, Callable, Dict, List

from app.agents.memoir.prompts import get_batch_memoir_phase1_prep_prompt
from app.agents.memoir.schemas import BatchPhase1LLMOutput
from app.agents.stage_constants import STAGE_SLOT_KEYS
from app.agents.state_schema import MemoirStateSchema
from app.core.config import settings
from app.core.llm_call import LLMCallError, llm_json_call
from app.core.logging import get_logger
from app.features.conversation.models import Segment

logger = get_logger(__name__)

# Frozen per-stage view of STAGE_SLOT_KEYS: every stage name maps to a
# frozenset of the values listed for it (presumably the slot keys permitted
# in that stage — confirm against stage_constants).
STAGE_ALLOWED_SLOTS: Dict[str, frozenset[str]] = {
    stage_name: frozenset(slot_keys)
    for stage_name, slot_keys in STAGE_SLOT_KEYS.items()
}


def _slots_snapshot(state: MemoirStateSchema) -> dict:
    """Build a compact ``{stage: {slot_key: snippet}}`` view of ``state.slots``.

    A slot value may be an object exposing a ``snippet`` attribute or a plain
    dict carrying a ``"snippet"`` key. Any other value, and any snippet that
    is missing or not a string, is recorded as ``""``. Snippets are cut to at
    most 120 characters.

    Args:
        state: Object whose ``slots`` attribute maps a stage name to a mapping
            of slot key to slot value. ``None`` or an empty mapping at either
            level is treated as empty.

    Returns:
        A new nested dict. Every stage present in ``state.slots`` appears in
        it, even when that stage has no slots.
    """
    max_len = 120
    snapshot: dict = {}
    for stage, buckets in (state.slots or {}).items():
        stage_view = snapshot[stage] = {}
        for key, value in (buckets or {}).items():
            if hasattr(value, "snippet"):
                raw = value.snippet
            elif isinstance(value, dict):
                raw = value.get("snippet")
            else:
                raw = None
            # Only real strings are kept. The dict form always ignored
            # non-string snippets; the attribute form now follows the same
            # rule instead of failing on (or leaking) a non-string value.
            stage_view[key] = raw[:max_len] if isinstance(raw, str) else ""
    return snapshot


@dataclass(frozen=True)
class BatchPhase1SegmentRow:
    """Immutable per-segment result parsed from the Phase1 batch LLM reply."""

    # Stage label for the segment. run_batch_phase1_prep stores the LLM's
    # value stripped and lower-cased, or the state's current stage
    # ("childhood" if that is empty) when the LLM gave none.
    detected_stage: str
    # Extracted slot values keyed by slot name; run_batch_phase1_prep coerces
    # every value to str before storing it here.
    slots: Dict[str, str]
    # Chapter category exactly as returned by the LLM (stringified, "" when
    # absent); no normalisation is applied in this module.
    chapter_category_raw: str


def run_batch_phase1_prep(
    segments: List[Segment],
    state: MemoirStateSchema,
    llm: Any,
) -> Dict[str, BatchPhase1SegmentRow]:
    """Extract and classify every segment with a single batched LLM call.

    Builds one prompt from the segments' stripped ``user_input_text`` plus a
    snapshot of ``state.slots``, parses the reply as ``BatchPhase1LLMOutput``
    and converts each returned row into a ``BatchPhase1SegmentRow``.

    Args:
        segments: Segments to process; their ``id`` values are stringified.
        state: Memoir state providing ``current_stage`` (``"childhood"`` is
            used when it is empty) and ``slots``.
        llm: LLM client handed to ``llm_json_call``; must be truthy.

    Returns:
        Mapping of segment id (as ``str``) to its row; ``{}`` when
        ``segments`` is empty.

    Raises:
        ValueError: If ``llm`` is falsy, the LLM call raises ``LLMCallError``,
            the reply contains no rows, or the returned ids are not exactly
            the input ids.
    """
    if not llm:
        raise ValueError("batch phase1 requires llm")
    if not segments:
        return {}

    segment_items = [
        (str(seg.id), (seg.user_input_text or "").strip()) for seg in segments
    ]
    prompt = get_batch_memoir_phase1_prep_prompt(
        system_current_stage=state.current_stage or "childhood",
        slots_snapshot=_slots_snapshot(state),
        segment_items=segment_items,
    )

    try:
        parsed = llm_json_call(
            llm,
            prompt,
            BatchPhase1LLMOutput,
            max_tokens=int(settings.memoir_phase1_batch_llm_max_tokens),
            agent="BatchPhase1Prep.run",
        )
    except LLMCallError as exc:
        logger.warning("batch phase1 LLM 解析失败: {}", exc)
        raise ValueError("batch phase1: llm parse failed") from exc

    llm_rows = parsed.segments
    if not llm_rows:
        raise ValueError("batch phase1: segments must be a non-empty list")

    result: Dict[str, BatchPhase1SegmentRow] = {}
    for llm_row in llm_rows:
        segment_id = str(llm_row.id).strip()
        if not segment_id:
            # Rows without a usable id are dropped; the id check below then
            # reports the segment as missing.
            continue

        stage = str(llm_row.detected_stage or "").strip().lower()

        slot_values: Dict[str, str] = {}
        for slot_key, slot_value in (llm_row.slots or {}).items():
            if not slot_key or not isinstance(slot_key, str):
                continue
            # NOTE(review): a None value becomes the literal string "None"
            # here — confirm that is intended.
            slot_values[slot_key] = (
                slot_value if isinstance(slot_value, str) else str(slot_value)
            )

        # A later row carrying the same id replaces the earlier one.
        result[segment_id] = BatchPhase1SegmentRow(
            detected_stage=stage or state.current_stage or "childhood",
            slots=slot_values,
            chapter_category_raw=str(llm_row.chapter_category or ""),
        )

    # The reply must cover exactly the requested ids: nothing missing, nothing
    # invented.
    expected = {str(seg.id) for seg in segments}
    missing = expected - result.keys()
    extra = result.keys() - expected
    if missing or extra:
        logger.warning("batch phase1 id mismatch missing={} extra={}", missing, extra)
        raise ValueError("batch phase1 response segment ids do not match input")
    return result


def _run_batch_phase1_prep_chunk_with_bisect(
    segments: List[Segment],
    state: MemoirStateSchema,
    llm: Any,
) -> Dict[str, BatchPhase1SegmentRow]:
    """Run one batch LLM call for a chunk, halving the chunk on failure.

    When ``run_batch_phase1_prep`` raises ``ValueError`` (for example because
    the reply was truncated or ids did not match), the chunk is split in two
    and each half is retried recursively, down to single segments.

    Args:
        segments: The chunk of segments to process.
        state: Memoir state forwarded to ``run_batch_phase1_prep``.
        llm: LLM client forwarded to ``run_batch_phase1_prep``; must be truthy.

    Returns:
        Mapping of segment id (as ``str``) to its row for the whole chunk.

    Raises:
        ValueError: If ``llm`` is falsy, if a chunk of at most one segment
            still fails, or if the merged halves do not cover exactly the
            chunk's ids.
    """
    # A missing LLM cannot be cured by splitting the chunk, so fail once here
    # with the same error run_batch_phase1_prep would raise instead of
    # recursing through every sub-chunk first.
    if not llm:
        raise ValueError("batch phase1 requires llm")
    try:
        return run_batch_phase1_prep(segments, state, llm)
    except ValueError:
        # Nothing left to split: surface the original failure.
        if len(segments) <= 1:
            raise
        mid = len(segments) // 2  # always >= 1 because len(segments) >= 2
        left = _run_batch_phase1_prep_chunk_with_bisect(segments[:mid], state, llm)
        right = _run_batch_phase1_prep_chunk_with_bisect(segments[mid:], state, llm)
        merged = {**left, **right}
        expected = {str(s.id) for s in segments}
        if merged.keys() != expected:
            # ``from None`` hides the earlier batch failure from the traceback.
            raise ValueError(
                "batch phase1 chunked bisect merge: segment ids do not match input"
            ) from None
        return merged


def run_batch_phase1_prep_chunked(
    segments: List[Segment],
    state: MemoirStateSchema,
    llm: Any,
    *,
    chunk_size: int,
    on_chunk: Callable[[int, int], None] | None = None,
) -> Dict[str, BatchPhase1SegmentRow]:
    """Process ``segments`` in slices of ``chunk_size`` and merge the results.

    Each slice goes through ``_run_batch_phase1_prep_chunk_with_bisect``, so a
    slice that fails as a whole is retried in halves down to single segments
    before the error propagates to the caller.

    Args:
        segments: All segments to process.
        state: Memoir state forwarded to every chunk call.
        llm: LLM client forwarded to every chunk call.
        chunk_size: Segments per LLM call; values below 1 are treated as 1.
        on_chunk: Optional callback invoked after each finished chunk with
            ``(chunk_idx, total_chunks)``, where ``chunk_idx`` starts at 1.

    Returns:
        Mapping of segment id (as ``str``) to its row; ``{}`` when
        ``segments`` is empty.

    Raises:
        ValueError: Propagated from a chunk that could not be processed, or
            raised here when the merged ids differ from the input ids.
    """
    if not segments:
        return {}

    step = max(chunk_size, 1)
    segment_count = len(segments)
    total_chunks = max(1, math.ceil(segment_count / step))

    combined: Dict[str, BatchPhase1SegmentRow] = {}
    for chunk_idx, start in enumerate(range(0, segment_count, step), start=1):
        chunk = segments[start : start + step]
        logger.info(
            "event=batch_phase1_chunk chunk_idx={}/{} segment_count={} batch_path=chunked "
            "msg=Phase1 批处理分块调用",
            chunk_idx,
            total_chunks,
            len(chunk),
        )
        combined.update(_run_batch_phase1_prep_chunk_with_bisect(chunk, state, llm))
        if on_chunk is not None:
            on_chunk(chunk_idx, total_chunks)

    # Final guard over the whole input: every id present, none invented.
    expected = {str(seg.id) for seg in segments}
    missing = expected - combined.keys()
    extra = combined.keys() - expected
    if missing or extra:
        logger.warning(
            "batch phase1 chunked id mismatch missing={} extra={}",
            missing,
            extra,
        )
        raise ValueError("batch phase1 chunked: merged segment ids do not match input")
    return combined
-												feat(api): 访谈路径轻量门控、Memoir Phase1 批处理与叙事/记忆管线加固

- 新增 utterance_substance：短时/应答/元话语可跳过记忆检索、阶段 LLM 与资料抽取 LLM；可配置
- 输入归一化：LLM 模式默认仅语音/ASR；配置项写入 .env.example
- Memoir Phase1：可选 batch LLM 一次性抽取+分类（失败回退逐段）；Extraction 空槽位时阶段与 current_stage 对齐，prompt 约束收紧
- 叙事与忠实度：narrative_safety、证据重叠/场合锚点、标题 slots 与履历短语 grounded；fidelity 解析失败 fail-open 可配置
- 章节管线：锁 TTL 上调、锁竞争 Celery 重试、Phase2 immediate singleflight 等；story_pipeline_sync / chapter_compose / memoir_tasks 联动
- Memory：compaction / repo / summarizer / evidence 小修；事实 FTS 未命中是否回退最近事实可配置
- 新增 memoir_pipeline_trace；补充 memoir_reliability 文档与多项回归/门控测试

											
										
										
											2026-04-03 10:12:59 +08:00
+								"""
 								Phase1 批处理：一次 LLM 调用完成多段的抽取 + 章节分类（与逐段循环语义对齐）。
 								"""
 								from __future__ import annotations
-												feat(eval): server-side replay/phase1 timing + memoir phase1 batch chunking

- Replay and memoir-submit responses include started/finished UTC and elapsed_ms;
  Phase1 poll exposes Redis-backed submit time and elapsed_ms_since_submit.
- Phase1 batch LLM splits segments by memoir_phase1_batch_llm_chunk_size with
  bisect fallback per chunk; Playground shows server timings.

Made-with: Cursor

											
										
										
											2026-04-09 13:38:53 +08:00
+								import math
-												feat(api): 访谈路径轻量门控、Memoir Phase1 批处理与叙事/记忆管线加固

- 新增 utterance_substance：短时/应答/元话语可跳过记忆检索、阶段 LLM 与资料抽取 LLM；可配置
- 输入归一化：LLM 模式默认仅语音/ASR；配置项写入 .env.example
- Memoir Phase1：可选 batch LLM 一次性抽取+分类（失败回退逐段）；Extraction 空槽位时阶段与 current_stage 对齐，prompt 约束收紧
- 叙事与忠实度：narrative_safety、证据重叠/场合锚点、标题 slots 与履历短语 grounded；fidelity 解析失败 fail-open 可配置
- 章节管线：锁 TTL 上调、锁竞争 Celery 重试、Phase2 immediate singleflight 等；story_pipeline_sync / chapter_compose / memoir_tasks 联动
- Memory：compaction / repo / summarizer / evidence 小修；事实 FTS 未命中是否回退最近事实可配置
- 新增 memoir_pipeline_trace；补充 memoir_reliability 文档与多项回归/门控测试

											
										
										
											2026-04-03 10:12:59 +08:00
+								from dataclasses import dataclass
-												feat(eval): memoir A/B chapter judging and eval-web parity with dialogue

- Judge baseline excerpt and library chapter separately; build_memoir_compare_summary for gate, nine-dim and leaf deltas.

- Memoir SSE chapter payload: baseline_judge, compare_summary, baseline_judge_error.

- MemoirJudgeOutput: loose score coercion and post-validate clamp; memoir judge prompt caps from settings.

- app-eval-web: two-column MemoirScoreCard layout, MemoirCompareSummary, chapter blocks and CSS.

- Add memoir_compare_summary, log_events, celery_log_context, memoir_pipeline_progress; tests and migration 0014.

- Misc: memory/evidence and enrichment paths, task/orchestrator updates, internal-eval docs, env examples.

											
										
										
											2026-04-10 10:23:43 +08:00
+								from typing import Any, Callable, Dict, List
-												feat(api): 访谈路径轻量门控、Memoir Phase1 批处理与叙事/记忆管线加固

- 新增 utterance_substance：短时/应答/元话语可跳过记忆检索、阶段 LLM 与资料抽取 LLM；可配置
- 输入归一化：LLM 模式默认仅语音/ASR；配置项写入 .env.example
- Memoir Phase1：可选 batch LLM 一次性抽取+分类（失败回退逐段）；Extraction 空槽位时阶段与 current_stage 对齐，prompt 约束收紧
- 叙事与忠实度：narrative_safety、证据重叠/场合锚点、标题 slots 与履历短语 grounded；fidelity 解析失败 fail-open 可配置
- 章节管线：锁 TTL 上调、锁竞争 Celery 重试、Phase2 immediate singleflight 等；story_pipeline_sync / chapter_compose / memoir_tasks 联动
- Memory：compaction / repo / summarizer / evidence 小修；事实 FTS 未命中是否回退最近事实可配置
- 新增 memoir_pipeline_trace；补充 memoir_reliability 文档与多项回归/门控测试

											
										
										
											2026-04-03 10:12:59 +08:00
 								from app.agents.memoir.prompts import get_batch_memoir_phase1_prep_prompt
-												feat(api): 统一 LLM JSON 调用层 llm_json_call，按域 Schema 迁移 chat/memoir agents

											
										
										
											2026-04-03 13:34:27 +08:00
+								from app.agents.memoir.schemas import BatchPhase1LLMOutput
 								from app.agents.stage_constants import STAGE_SLOT_KEYS
-												feat: 回忆录证据血缘与内部评测可追溯，顺带对齐本地评测台与 CI

数据库与模型：新增多版迁移（章节证据快照、对话血缘、记忆事实/时间线 lineage 等），把「成稿 ↔ 对话/记忆」的溯源信息落到表结构里。
业务链路：会话与 WS、回忆录/故事流水线、记忆写入与 enrichment 等跟着接上线索与快照；新增章节证据快照与评测侧 EvalTraceService 等模块，方便组评审用的证据包。
内部评测：自动化 run 与手工 memoir 评审共用可追溯证据；rubric/ judge 相关脚本与文档有配套调整。
app-eval-web：Memoir/实验详情里能展开看证据摘要与 evidence_trace（含对话轮次 id）；Vite 代理与 development.sh 注入的 API 端口与当前默认内部评测端口一致，避免改端口后页面连错服务。
工程杂项：GitHub Actions / 仓库说明有更新；各适配器与支付/配额/plan 等多处为小改动或跟随主改动的收尾；新增/扩充了?

											
										
										
											2026-04-08 15:37:09 +08:00
+								from app.agents.state_schema import MemoirStateSchema
-												feat(api): 访谈路径轻量门控、Memoir Phase1 批处理与叙事/记忆管线加固

- 新增 utterance_substance：短时/应答/元话语可跳过记忆检索、阶段 LLM 与资料抽取 LLM；可配置
- 输入归一化：LLM 模式默认仅语音/ASR；配置项写入 .env.example
- Memoir Phase1：可选 batch LLM 一次性抽取+分类（失败回退逐段）；Extraction 空槽位时阶段与 current_stage 对齐，prompt 约束收紧
- 叙事与忠实度：narrative_safety、证据重叠/场合锚点、标题 slots 与履历短语 grounded；fidelity 解析失败 fail-open 可配置
- 章节管线：锁 TTL 上调、锁竞争 Celery 重试、Phase2 immediate singleflight 等；story_pipeline_sync / chapter_compose / memoir_tasks 联动
- Memory：compaction / repo / summarizer / evidence 小修；事实 FTS 未命中是否回退最近事实可配置
- 新增 memoir_pipeline_trace；补充 memoir_reliability 文档与多项回归/门控测试

											
										
										
											2026-04-03 10:12:59 +08:00
+								from app.core.config import settings
-												feat(api): 统一 LLM JSON 调用层 llm_json_call，按域 Schema 迁移 chat/memoir agents

											
										
										
											2026-04-03 13:34:27 +08:00
+								from app.core.llm_call import LLMCallError, llm_json_call
-												feat(api): 访谈路径轻量门控、Memoir Phase1 批处理与叙事/记忆管线加固

- 新增 utterance_substance：短时/应答/元话语可跳过记忆检索、阶段 LLM 与资料抽取 LLM；可配置
- 输入归一化：LLM 模式默认仅语音/ASR；配置项写入 .env.example
- Memoir Phase1：可选 batch LLM 一次性抽取+分类（失败回退逐段）；Extraction 空槽位时阶段与 current_stage 对齐，prompt 约束收紧
- 叙事与忠实度：narrative_safety、证据重叠/场合锚点、标题 slots 与履历短语 grounded；fidelity 解析失败 fail-open 可配置
- 章节管线：锁 TTL 上调、锁竞争 Celery 重试、Phase2 immediate singleflight 等；story_pipeline_sync / chapter_compose / memoir_tasks 联动
- Memory：compaction / repo / summarizer / evidence 小修；事实 FTS 未命中是否回退最近事实可配置
- 新增 memoir_pipeline_trace；补充 memoir_reliability 文档与多项回归/门控测试

											
										
										
											2026-04-03 10:12:59 +08:00
+								from app.core.logging import get_logger
 								from app.features.conversation.models import Segment
 								logger = get_logger(__name__)
 								STAGE_ALLOWED_SLOTS: Dict[str, frozenset[str]] = {
-												feat(api): 统一 LLM JSON 调用层 llm_json_call，按域 Schema 迁移 chat/memoir agents

											
										
										
											2026-04-03 13:34:27 +08:00
+								    k: frozenset(v) for k, v in STAGE_SLOT_KEYS.items()
-												feat(api): 访谈路径轻量门控、Memoir Phase1 批处理与叙事/记忆管线加固

- 新增 utterance_substance：短时/应答/元话语可跳过记忆检索、阶段 LLM 与资料抽取 LLM；可配置
- 输入归一化：LLM 模式默认仅语音/ASR；配置项写入 .env.example
- Memoir Phase1：可选 batch LLM 一次性抽取+分类（失败回退逐段）；Extraction 空槽位时阶段与 current_stage 对齐，prompt 约束收紧
- 叙事与忠实度：narrative_safety、证据重叠/场合锚点、标题 slots 与履历短语 grounded；fidelity 解析失败 fail-open 可配置
- 章节管线：锁 TTL 上调、锁竞争 Celery 重试、Phase2 immediate singleflight 等；story_pipeline_sync / chapter_compose / memoir_tasks 联动
- Memory：compaction / repo / summarizer / evidence 小修；事实 FTS 未命中是否回退最近事实可配置
- 新增 memoir_pipeline_trace；补充 memoir_reliability 文档与多项回归/门控测试

											
										
										
											2026-04-03 10:12:59 +08:00
+								}
 								def _slots_snapshot(state: MemoirStateSchema) -> dict:
 								    snap: dict = {}
 								    for stage, buckets in (state.slots or {}).items():
 								        snap[stage] = {}
 								        for k, v in (buckets or {}).items():
 								            if hasattr(v, "snippet"):
 								                sn = getattr(v, "snippet", None) or ""
 								            elif isinstance(v, dict):
 								                sn = (
 								                    (v.get("snippet") or "")
 								                    if isinstance(v.get("snippet"), str)
 								                    else ""
 								                )
 								            else:
 								                sn = ""
 								            snap[stage][k] = (sn or "")[:120]
 								    return snap
 								@dataclass(frozen=True)
 								class BatchPhase1SegmentRow:
 								    detected_stage: str
 								    slots: Dict[str, str]
 								    chapter_category_raw: str
 								def run_batch_phase1_prep(
 								    segments: List[Segment],
 								    state: MemoirStateSchema,
 								    llm: Any,
 								) -> Dict[str, BatchPhase1SegmentRow]:
 								    """对 segments 顺序批量调用 LLM；返回 id → 行。id 集合必须与入参完全一致。"""
 								    if not llm:
 								        raise ValueError("batch phase1 requires llm")
 								    if not segments:
 								        return {}
 								    items = [(str(s.id), (s.user_input_text or "").strip()) for s in segments]
 								    prompt = get_batch_memoir_phase1_prep_prompt(
 								        system_current_stage=state.current_stage or "childhood",
 								        slots_snapshot=_slots_snapshot(state),
 								        segment_items=items,
 								    )
-												feat(api): 统一 LLM JSON 调用层 llm_json_call，按域 Schema 迁移 chat/memoir agents

											
										
										
											2026-04-03 13:34:27 +08:00
+								    try:
 								        parsed = llm_json_call(
 								            llm,
 								            prompt,
 								            BatchPhase1LLMOutput,
 								            max_tokens=int(settings.memoir_phase1_batch_llm_max_tokens),
 								            agent="BatchPhase1Prep.run",
 								        )
 								    except LLMCallError as e:
 								        logger.warning("batch phase1 LLM 解析失败: {}", e)
 								        raise ValueError("batch phase1: llm parse failed") from e
 								    rows = parsed.segments
 								    if not rows:
 								        raise ValueError("batch phase1: segments must be a non-empty list")
-												feat(api): 访谈路径轻量门控、Memoir Phase1 批处理与叙事/记忆管线加固

- 新增 utterance_substance：短时/应答/元话语可跳过记忆检索、阶段 LLM 与资料抽取 LLM；可配置
- 输入归一化：LLM 模式默认仅语音/ASR；配置项写入 .env.example
- Memoir Phase1：可选 batch LLM 一次性抽取+分类（失败回退逐段）；Extraction 空槽位时阶段与 current_stage 对齐，prompt 约束收紧
- 叙事与忠实度：narrative_safety、证据重叠/场合锚点、标题 slots 与履历短语 grounded；fidelity 解析失败 fail-open 可配置
- 章节管线：锁 TTL 上调、锁竞争 Celery 重试、Phase2 immediate singleflight 等；story_pipeline_sync / chapter_compose / memoir_tasks 联动
- Memory：compaction / repo / summarizer / evidence 小修；事实 FTS 未命中是否回退最近事实可配置
- 新增 memoir_pipeline_trace；补充 memoir_reliability 文档与多项回归/门控测试

											
										
										
											2026-04-03 10:12:59 +08:00
 								    by_id: Dict[str, BatchPhase1SegmentRow] = {}
 								    for row in rows:
-												feat(api): 统一 LLM JSON 调用层 llm_json_call，按域 Schema 迁移 chat/memoir agents

											
										
										
											2026-04-03 13:34:27 +08:00
+								        sid = str(row.id).strip()
-												feat(api): 访谈路径轻量门控、Memoir Phase1 批处理与叙事/记忆管线加固

- 新增 utterance_substance：短时/应答/元话语可跳过记忆检索、阶段 LLM 与资料抽取 LLM；可配置
- 输入归一化：LLM 模式默认仅语音/ASR；配置项写入 .env.example
- Memoir Phase1：可选 batch LLM 一次性抽取+分类（失败回退逐段）；Extraction 空槽位时阶段与 current_stage 对齐，prompt 约束收紧
- 叙事与忠实度：narrative_safety、证据重叠/场合锚点、标题 slots 与履历短语 grounded；fidelity 解析失败 fail-open 可配置
- 章节管线：锁 TTL 上调、锁竞争 Celery 重试、Phase2 immediate singleflight 等；story_pipeline_sync / chapter_compose / memoir_tasks 联动
- Memory：compaction / repo / summarizer / evidence 小修；事实 FTS 未命中是否回退最近事实可配置
- 新增 memoir_pipeline_trace；补充 memoir_reliability 文档与多项回归/门控测试

											
										
										
											2026-04-03 10:12:59 +08:00
+								        if not sid:
 								            continue
-												feat(api): 统一 LLM JSON 调用层 llm_json_call，按域 Schema 迁移 chat/memoir agents

											
										
										
											2026-04-03 13:34:27 +08:00
+								        ds = str(row.detected_stage or "").strip().lower()
 								        slots_raw = row.slots or {}
 								        slots = {
 								            k: v if isinstance(v, str) else str(v)
 								            for k, v in slots_raw.items()
 								            if k and isinstance(k, str)
 								        }
 								        cat_raw = str(row.chapter_category or "")
-												feat(api): 访谈路径轻量门控、Memoir Phase1 批处理与叙事/记忆管线加固

- 新增 utterance_substance：短时/应答/元话语可跳过记忆检索、阶段 LLM 与资料抽取 LLM；可配置
- 输入归一化：LLM 模式默认仅语音/ASR；配置项写入 .env.example
- Memoir Phase1：可选 batch LLM 一次性抽取+分类（失败回退逐段）；Extraction 空槽位时阶段与 current_stage 对齐，prompt 约束收紧
- 叙事与忠实度：narrative_safety、证据重叠/场合锚点、标题 slots 与履历短语 grounded；fidelity 解析失败 fail-open 可配置
- 章节管线：锁 TTL 上调、锁竞争 Celery 重试、Phase2 immediate singleflight 等；story_pipeline_sync / chapter_compose / memoir_tasks 联动
- Memory：compaction / repo / summarizer / evidence 小修；事实 FTS 未命中是否回退最近事实可配置
- 新增 memoir_pipeline_trace；补充 memoir_reliability 文档与多项回归/门控测试

											
										
										
											2026-04-03 10:12:59 +08:00
+								        by_id[sid] = BatchPhase1SegmentRow(
 								            detected_stage=ds or (state.current_stage or "childhood"),
 								            slots=slots,
 								            chapter_category_raw=cat_raw,
 								        )
 								    expected = {str(s.id) for s in segments}
 								    if by_id.keys() != expected:
 								        missing = expected - by_id.keys()
 								        extra = by_id.keys() - expected
 								        logger.warning("batch phase1 id mismatch missing={} extra={}", missing, extra)
 								        raise ValueError("batch phase1 response segment ids do not match input")
 								    return by_id
-												feat(eval): server-side replay/phase1 timing + memoir phase1 batch chunking

- Replay and memoir-submit responses include started/finished UTC and elapsed_ms;
  Phase1 poll exposes Redis-backed submit time and elapsed_ms_since_submit.
- Phase1 batch LLM splits segments by memoir_phase1_batch_llm_chunk_size with
  bisect fallback per chunk; Playground shows server timings.

Made-with: Cursor

											
										
										
											2026-04-09 13:38:53 +08:00
 								def _run_batch_phase1_prep_chunk_with_bisect(
 								    segments: List[Segment],
 								    state: MemoirStateSchema,
 								    llm: Any,
 								) -> Dict[str, BatchPhase1SegmentRow]:
 								    """单块 LLM；失败时（如输出截断）将块二等分重试直至单段。"""
 								    try:
 								        return run_batch_phase1_prep(segments, state, llm)
 								    except ValueError:
 								        if len(segments) <= 1:
 								            raise
 								        mid = len(segments) // 2
 								        if mid < 1:
 								            raise
-												fix:
1. 修复登录界面文字被遮挡问题
2. 大字模式关闭后显示异常问题
3. 重新调整大字模式是否开启时的字体显示效果

											
										
										
											2026-04-10 20:35:57 +08:00
+								        left = _run_batch_phase1_prep_chunk_with_bisect(segments[:mid], state, llm)
 								        right = _run_batch_phase1_prep_chunk_with_bisect(segments[mid:], state, llm)
-												feat(eval): server-side replay/phase1 timing + memoir phase1 batch chunking

- Replay and memoir-submit responses include started/finished UTC and elapsed_ms;
  Phase1 poll exposes Redis-backed submit time and elapsed_ms_since_submit.
- Phase1 batch LLM splits segments by memoir_phase1_batch_llm_chunk_size with
  bisect fallback per chunk; Playground shows server timings.

Made-with: Cursor

											
										
										
											2026-04-09 13:38:53 +08:00
+								        merged = {**left, **right}
 								        expected = {str(s.id) for s in segments}
 								        if merged.keys() != expected:
 								            raise ValueError(
 								                "batch phase1 chunked bisect merge: segment ids do not match input"
-												feat(eval): memoir A/B chapter judging and eval-web parity with dialogue

- Judge baseline excerpt and library chapter separately; build_memoir_compare_summary for gate, nine-dim and leaf deltas.

- Memoir SSE chapter payload: baseline_judge, compare_summary, baseline_judge_error.

- MemoirJudgeOutput: loose score coercion and post-validate clamp; memoir judge prompt caps from settings.

- app-eval-web: two-column MemoirScoreCard layout, MemoirCompareSummary, chapter blocks and CSS.

- Add memoir_compare_summary, log_events, celery_log_context, memoir_pipeline_progress; tests and migration 0014.

- Misc: memory/evidence and enrichment paths, task/orchestrator updates, internal-eval docs, env examples.

											
										
										
											2026-04-10 10:23:43 +08:00
+								            ) from None
-												feat(eval): server-side replay/phase1 timing + memoir phase1 batch chunking

- Replay and memoir-submit responses include started/finished UTC and elapsed_ms;
  Phase1 poll exposes Redis-backed submit time and elapsed_ms_since_submit.
- Phase1 batch LLM splits segments by memoir_phase1_batch_llm_chunk_size with
  bisect fallback per chunk; Playground shows server timings.

Made-with: Cursor

											
										
										
											2026-04-09 13:38:53 +08:00
+								        return merged
 								def run_batch_phase1_prep_chunked(
 								    segments: List[Segment],
 								    state: MemoirStateSchema,
 								    llm: Any,
 								    *,
 								    chunk_size: int,
-												feat(eval): memoir A/B chapter judging and eval-web parity with dialogue

- Judge baseline excerpt and library chapter separately; build_memoir_compare_summary for gate, nine-dim and leaf deltas.

- Memoir SSE chapter payload: baseline_judge, compare_summary, baseline_judge_error.

- MemoirJudgeOutput: loose score coercion and post-validate clamp; memoir judge prompt caps from settings.

- app-eval-web: two-column MemoirScoreCard layout, MemoirCompareSummary, chapter blocks and CSS.

- Add memoir_compare_summary, log_events, celery_log_context, memoir_pipeline_progress; tests and migration 0014.

- Misc: memory/evidence and enrichment paths, task/orchestrator updates, internal-eval docs, env examples.

											
										
										
											2026-04-10 10:23:43 +08:00
+								    on_chunk: Callable[[int, int], None] | None = None,
-												feat(eval): server-side replay/phase1 timing + memoir phase1 batch chunking

- Replay and memoir-submit responses include started/finished UTC and elapsed_ms;
  Phase1 poll exposes Redis-backed submit time and elapsed_ms_since_submit.
- Phase1 batch LLM splits segments by memoir_phase1_batch_llm_chunk_size with
  bisect fallback per chunk; Playground shows server timings.

Made-with: Cursor

											
										
										
											2026-04-09 13:38:53 +08:00
+								) -> Dict[str, BatchPhase1SegmentRow]:
 								    """
 								    将 segments 按 chunk_size 切片多次调用 Phase1 批处理 LLM，合并 by_id。
 								    单块仍失败时在块内二分回退（最后回退到单段），与 orchestrator 外层逐段回退衔接。
 								    """
 								    if not segments:
 								        return {}
 								    if chunk_size < 1:
 								        chunk_size = 1
 								    n = len(segments)
 								    total_chunks = max(1, math.ceil(n / chunk_size))
 								    merged: Dict[str, BatchPhase1SegmentRow] = {}
 								    for i in range(0, n, chunk_size):
 								        chunk_idx = i // chunk_size + 1
 								        sub = segments[i : i + chunk_size]
 								        logger.info(
-												feat(eval): memoir A/B chapter judging and eval-web parity with dialogue

- Judge baseline excerpt and library chapter separately; build_memoir_compare_summary for gate, nine-dim and leaf deltas.

- Memoir SSE chapter payload: baseline_judge, compare_summary, baseline_judge_error.

- MemoirJudgeOutput: loose score coercion and post-validate clamp; memoir judge prompt caps from settings.

- app-eval-web: two-column MemoirScoreCard layout, MemoirCompareSummary, chapter blocks and CSS.

- Add memoir_compare_summary, log_events, celery_log_context, memoir_pipeline_progress; tests and migration 0014.

- Misc: memory/evidence and enrichment paths, task/orchestrator updates, internal-eval docs, env examples.

											
										
										
											2026-04-10 10:23:43 +08:00
+								            "event=batch_phase1_chunk chunk_idx={}/{} segment_count={} batch_path=chunked "
 								            "msg=Phase1 批处理分块调用",
-												feat(eval): server-side replay/phase1 timing + memoir phase1 batch chunking

- Replay and memoir-submit responses include started/finished UTC and elapsed_ms;
  Phase1 poll exposes Redis-backed submit time and elapsed_ms_since_submit.
- Phase1 batch LLM splits segments by memoir_phase1_batch_llm_chunk_size with
  bisect fallback per chunk; Playground shows server timings.

Made-with: Cursor

											
										
										
											2026-04-09 13:38:53 +08:00
+								            chunk_idx,
 								            total_chunks,
 								            len(sub),
 								        )
 								        part = _run_batch_phase1_prep_chunk_with_bisect(sub, state, llm)
 								        merged.update(part)
-												feat(eval): memoir A/B chapter judging and eval-web parity with dialogue

- Judge baseline excerpt and library chapter separately; build_memoir_compare_summary for gate, nine-dim and leaf deltas.

- Memoir SSE chapter payload: baseline_judge, compare_summary, baseline_judge_error.

- MemoirJudgeOutput: loose score coercion and post-validate clamp; memoir judge prompt caps from settings.

- app-eval-web: two-column MemoirScoreCard layout, MemoirCompareSummary, chapter blocks and CSS.

- Add memoir_compare_summary, log_events, celery_log_context, memoir_pipeline_progress; tests and migration 0014.

- Misc: memory/evidence and enrichment paths, task/orchestrator updates, internal-eval docs, env examples.

											
										
										
											2026-04-10 10:23:43 +08:00
+								        if on_chunk is not None:
 								            on_chunk(chunk_idx, total_chunks)
-												feat(eval): server-side replay/phase1 timing + memoir phase1 batch chunking

- Replay and memoir-submit responses include started/finished UTC and elapsed_ms;
  Phase1 poll exposes Redis-backed submit time and elapsed_ms_since_submit.
- Phase1 batch LLM splits segments by memoir_phase1_batch_llm_chunk_size with
  bisect fallback per chunk; Playground shows server timings.

Made-with: Cursor

											
										
										
											2026-04-09 13:38:53 +08:00
+								    expected = {str(s.id) for s in segments}
 								    if merged.keys() != expected:
 								        missing = expected - merged.keys()
 								        extra = merged.keys() - expected
 								        logger.warning(
 								            "batch phase1 chunked id mismatch missing={} extra={}",
 								            missing,
 								            extra,
 								        )
-												fix:
1. 修复登录界面文字被遮挡问题
2. 大字模式关闭后显示异常问题
3. 重新调整大字模式是否开启时的字体显示效果

											
										
										
											2026-04-10 20:35:57 +08:00
+								        raise ValueError("batch phase1 chunked: merged segment ids do not match input")
-												feat(eval): server-side replay/phase1 timing + memoir phase1 batch chunking

- Replay and memoir-submit responses include started/finished UTC and elapsed_ms;
  Phase1 poll exposes Redis-backed submit time and elapsed_ms_since_submit.
- Phase1 batch LLM splits segments by memoir_phase1_batch_llm_chunk_size with
  bisect fallback per chunk; Playground shows server timings.

Made-with: Cursor

											
										
										
											2026-04-09 13:38:53 +08:00
+								    return merged