Files
operating-room-monitor-server/app/services/voice_file_log.py
Kevin 3d7bd70355 feat: 手术视频消耗、待确认与持久化改造
- 新增 Alembic 初始迁移、领域明细模型及归档持久化与重试链路\n- 拆分视频会话注册表、分类处理、推理时间窗聚合与流处理\n- 消耗日志:TSV/Markdown 含 top2/top3;item_id 优先产品编码;待确认记「待确认」行,语音确认后落正式行并更新汇总\n- 待确认时内存/DB 明细为占位行,确认后替换;拒绝时移除占位\n- 分类 probs 先 detach/cpu 再转 NumPy,修复 MPS/CUDA 上推理被静默跳过\n- 补充集成测试、归档与设备张量等单测

Made-with: Cursor
2026-04-23 20:42:21 +08:00

207 lines
6.2 KiB
Python
Raw Blame History

This file contains ambiguous Unicode characters
This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.
"""语音确认ASR/解析/审计)的终端 loguru 行 + 每手术 TSV 落盘,与 `consumption_tsv_log` 并列。"""
from __future__ import annotations
import re
import threading
from datetime import datetime, timezone
from pathlib import Path
from zoneinfo import ZoneInfo, ZoneInfoNotFoundError
from loguru import logger
from app.config import Settings
_lock = threading.Lock()
HEADER = (
"时间戳(ISO,UTC)\t来源\t状态\tconfirmation_id\tasr/识别文本\t"
"resolved_label\trejected\terror\taudio_object_key\n"
)
def _ts_iso_utc() -> str:
return datetime.now(timezone.utc).isoformat(timespec="milliseconds")
def _encode_cell(value: str) -> str:
return (value or "").replace("\r", " ").replace("\n", " ").replace("\t", " ")
def _log_tz_info(settings: Settings) -> object:
raw = (settings.consumption_log_timezone or "").strip()
if not raw:
lt = datetime.now().astimezone().tzinfo
return lt if lt is not None else timezone.utc
try:
return ZoneInfo(raw)
except ZoneInfoNotFoundError:
return timezone.utc
def _ts_local_for_display(settings: Settings) -> str:
tz = _log_tz_info(settings)
return datetime.now(tz).isoformat(timespec="milliseconds")
def _safe_surgery_path_segment(surgery_id: str) -> str:
s = (surgery_id or "unknown").strip() or "unknown"
s = re.sub(r"[^\w\-.@]", "_", s)
return s[:200] if len(s) > 200 else s
def resolved_voice_log_path(surgery_id: str, settings: Settings) -> Path:
raw = (settings.voice_file_log_path or "logs/voice_{surgery_id}.txt").strip()
safe = _safe_surgery_path_segment(surgery_id)
if "{surgery_id}" in raw:
raw = raw.replace("{surgery_id}", safe)
else:
p0 = Path(raw)
if p0.suffix:
raw = str(p0.with_name(f"{p0.stem}_{safe}{p0.suffix}"))
else:
raw = f"{raw.rstrip('/')}_{safe}.txt"
p = Path(raw).expanduser()
if not p.is_absolute():
p = Path.cwd() / p
return p
def init_voice_log_file(surgery_id: str, settings: Settings) -> None:
"""与 `init_consumption_log_file` 同生命周期:`start_surgery` 时截断并写表头。"""
if not settings.voice_file_log_enabled:
return
path = resolved_voice_log_path(surgery_id, settings)
path.parent.mkdir(parents=True, exist_ok=True)
with _lock:
with path.open("w", encoding="utf-8") as f:
f.write(HEADER)
def append_voice_tsv_line(surgery_id: str, line: str, settings: Settings) -> None:
if not settings.voice_file_log_enabled:
return
path = resolved_voice_log_path(surgery_id, settings)
path.parent.mkdir(parents=True, exist_ok=True)
with _lock:
with path.open("a", encoding="utf-8") as f:
f.write(line)
class VoiceTextLogWriter:
"""注入式 voice 日志写入器,封装 `init_file` / `emit_event`。
行为等价于模块级函数;保留模块级函数以兼容既有调用点。
"""
def __init__(self, app_settings: Settings) -> None:
self._s = app_settings
def init_file(self, surgery_id: str) -> None:
init_voice_log_file(surgery_id, self._s)
def emit_event(
self,
*,
surgery_id: str,
source: str,
status: str,
confirmation_id: str,
asr_text: str | None = None,
resolved_label: str | None = None,
rejected: str | bool | None = None,
error_message: str | None = None,
audio_object_key: str | None = None,
) -> None:
emit_voice_event(
self._s,
surgery_id=surgery_id,
source=source,
status=status,
confirmation_id=confirmation_id,
asr_text=asr_text,
resolved_label=resolved_label,
rejected=rejected,
error_message=error_message,
audio_object_key=audio_object_key,
)
def emit_voice_event(
settings: Settings,
*,
surgery_id: str,
source: str,
status: str,
confirmation_id: str,
asr_text: str | None = None,
resolved_label: str | None = None,
rejected: str | bool | None = None,
error_message: str | None = None,
audio_object_key: str | None = None,
) -> None:
"""
终端:单条可 grep 的 VoiceConfirm 行文件TSV 一行(与启用的 `voice_file_log_enabled` 一致)。
:param source: `wav` | `text` | `n/a`
:param status: 与审计 `status` 或 `minio_not_configured` 等说明型状态一致
"""
rj: str
if rejected is None:
rj = ""
elif isinstance(rejected, bool):
rj = "true" if rejected else "false"
else:
rj = str(rejected)
ts_utc = _ts_iso_utc()
local_hint = _ts_local_for_display(settings)
if status in ("recognized", "rejected"):
logger.info(
"VoiceConfirm local_ts={!r} surgery_id={} source={} status={} "
"confirmation_id={} asr_text={!r} resolved_label={!r} rejected={} "
"error={!r} audio_key={!r}",
local_hint,
surgery_id,
source,
status,
confirmation_id,
asr_text,
resolved_label,
rj,
error_message,
audio_object_key,
)
else:
logger.warning(
"VoiceConfirm local_ts={!r} surgery_id={} source={} status={} "
"confirmation_id={} asr_text={!r} resolved_label={!r} rejected={} "
"error={!r} audio_key={!r}",
local_hint,
surgery_id,
source,
status,
confirmation_id,
asr_text,
resolved_label,
rj,
error_message,
audio_object_key,
)
if not settings.voice_file_log_enabled:
return
row = [
_encode_cell(ts_utc),
_encode_cell(source),
_encode_cell(status),
_encode_cell(confirmation_id),
_encode_cell("" if asr_text is None else asr_text),
_encode_cell("" if resolved_label is None else resolved_label),
_encode_cell(rj),
_encode_cell("" if error_message is None else error_message),
_encode_cell("" if audio_object_key is None else audio_object_key),
]
line = "\t".join(row) + "\n"
append_voice_tsv_line(surgery_id, line, settings)