392 lines
12 KiB
Python
392 lines
12 KiB
Python
"""后台轮询目录中的 .svo2,逐段跑 FishMeasure,齐套后聚合 final(与 ingest 共用 SQLite)。"""
|
||
|
||
from __future__ import annotations
|
||
|
||
import asyncio
|
||
import hashlib
|
||
from pathlib import Path
|
||
from typing import Dict, List, Set, Tuple
|
||
|
||
from loguru import logger
|
||
|
||
from app.compat import to_thread
|
||
|
||
from app.db import (
|
||
add_watch_processed,
|
||
load_watch_processed,
|
||
measure_snapshot_deliverable,
|
||
save_measure_snapshot,
|
||
)
|
||
from app.services import measure as measure_svc
|
||
from app.settings import Settings
|
||
from app.state import app_state
|
||
from app.watch_idle import IdleWatchWarnState, idle_warn_interval_sec, maybe_warn_idle_watch
|
||
|
||
# Interval handed to maybe_warn_idle_watch() as ``interval_sec`` by the watch loop.
# NOTE(review): presumably resolved by app.watch_idle from the environment
# variable named below -- confirm against idle_warn_interval_sec().
_MEASURE_IDLE_WARN_INTERVAL_SEC = idle_warn_interval_sec(
    "FISH_MEASURE_WATCH_IDLE_WARN_INTERVAL_SEC",
)
|
||
|
||
|
||
def _state_path(settings: Settings) -> Path:
    """Return the path of the legacy JSON state file.

    The file sits directly inside the measure watch directory and is only
    used for compatibility, so that old state can be imported into SQLite.
    """
    watch_dir = settings.measure_watch_dir
    assert watch_dir is not None
    return watch_dir.joinpath(".fishmeasure_watch_processed.json")
|
||
|
||
|
||
def iter_svo2_folders(watch_dir: Path) -> List[Tuple[List[Path], str]]:
    """Scan ``watch_dir`` for ``fish{N}`` sub-folders that contain ``.svo2`` files.

    Sub-folders must be named ``fish`` followed by digits only. The ``.svo2``
    files of one folder are measured segment by segment and aggregated into
    a final result once the set is complete.

    Args:
        watch_dir: Directory whose immediate sub-folders are scanned.

    Returns:
        A list of ``(svo_files, fish_id)`` tuples ordered by folder path.
        ``svo_files`` is the sorted list of ``.svo2`` files (suffix matched
        case-insensitively) and ``fish_id`` is the digit string after
        ``fish``. Folders without any ``.svo2`` file are left out. The list
        is empty when ``watch_dir`` is not a directory.
    """
    result: List[Tuple[List[Path], str]] = []
    if not watch_dir.is_dir():
        return result

    try:
        entries = sorted(watch_dir.iterdir())
    except OSError:
        # The watch directory vanished or became unreadable between the
        # is_dir() check and the listing; the next scan tries again.
        return result

    prefix = "fish"
    for entry in entries:
        folder_name = entry.name
        if not entry.is_dir() or not folder_name.startswith(prefix):
            continue

        # Slicing and isdigit() never raise, so no exception guard is needed.
        fish_id = folder_name[len(prefix):]
        if not fish_id.isdigit():
            continue

        try:
            svo_files = sorted(
                p for p in entry.iterdir()
                if p.is_file() and p.suffix.lower() == ".svo2"
            )
        except OSError:
            # Folder removed or unreadable mid-scan: skip just this folder
            # instead of aborting the scan of all the others.
            continue

        if svo_files:
            result.append((svo_files, fish_id))

    return result
|
||
|
||
|
||
def _final_processed_key(fish_id: str, svo_list: List[Path]) -> str:
    """Build the processed-set key for the final aggregate of one fish folder.

    The key embeds the first 24 hex characters of the SHA-256 of the sorted,
    ``|``-joined resolved segment paths. It is therefore independent of the
    order of ``svo_list`` and changes whenever the set of paths changes.
    """
    resolved_paths = [str(path.resolve()) for path in svo_list]
    resolved_paths.sort()
    signature = "|".join(resolved_paths).encode("utf-8")
    short_hash = hashlib.sha256(signature).hexdigest()[:24]
    return f"__measure_final__fish{fish_id}:{short_hash}"
|
||
|
||
|
||
def _folder_size_tuple(svo_list: List[Path]) -> Tuple[Tuple[str, int], ...]:
    """Return a ``(resolved_path, size_in_bytes)`` fingerprint of the given files.

    Entries are ordered by resolved path. If any file cannot be examined
    (``OSError``), an empty tuple is returned instead of a partial result.
    """
    ordered = sorted(svo_list, key=lambda path: str(path.resolve()))
    try:
        return tuple(
            (str(path.resolve()), int(path.stat().st_size)) for path in ordered
        )
    except OSError:
        return ()
|
||
|
||
|
||
async def _run_single_svo_measure(
    svo: Path,
    fish_id: str,
    settings: Settings,
    processed: Set[str],
    state_file: Path,
) -> None:
    """Run FishMeasure on one ``.svo2`` segment and record it as processed.

    The measurement runs in a worker thread while ``app_state.measure_lock``
    is held. The snapshot is tagged as a ``"segment"`` and saved only when it
    is deliverable. Measurement failures are logged, not raised, and the
    segment is still marked as processed so it is not retried on every poll.

    Args:
        svo: Segment file to measure.
        fish_id: Digit string taken from the ``fish{N}`` folder name.
        settings: Application settings (output root, state-file switch, ...).
        processed: In-memory set of processed keys; updated in place.
        state_file: Unused here; kept so the call signature stays stable.
    """
    key = str(svo.resolve())
    fish_folder = svo.parent.resolve()
    fish_output_root = settings.measure_output_root / f"fish{fish_id}"
    fish_output_root.mkdir(parents=True, exist_ok=True)

    logger.info(
        "[measure-watch] segment inference fish_id={} svo={}",
        fish_id,
        svo.name,
    )

    def _run():
        # The thread lock serialises the blocking measure call itself.
        with app_state.measure_thread_lock:
            return measure_svc.run_full_measure(
                svo, settings, output_root=fish_output_root
            )

    async with app_state.measure_lock:
        app_state.measure_status = "running"
        try:
            snap = await to_thread(_run)

            snap = measure_svc.tag_measure_snapshot_meta(
                snap,
                measurement_phase="segment",
                fish_folder=str(fish_folder),
                segment_source=str(svo.resolve()),
            )

            if measure_snapshot_deliverable(snap):
                save_measure_snapshot(
                    settings,
                    snap,
                    source_path=str(svo.resolve()),
                    client_id=None,
                )
            else:
                logger.warning(
                    "[measure-watch] no deliverable measure rows for fish_id={} svo={}, skip SQLite",
                    fish_id,
                    svo.name,
                )

            r0 = snap.result[0] if snap.result else {}
            logger.info(
                "[measure-watch] segment done: fish_id={} svo={} weight={!r}",
                fish_id,
                svo.name,
                r0.get("weight", ""),
            )

        except asyncio.CancelledError:
            # Cancellation is not a measurement failure. Before Python 3.8 it
            # is an Exception subclass and would be swallowed by the generic
            # handler below, marking an unmeasured segment as processed.
            raise

        except (RuntimeError, FileNotFoundError) as e:
            logger.warning(
                "[measure-watch] measure failed fish_id={} svo={}: {}",
                fish_id,
                svo.name,
                e,
            )

        except Exception as e:
            logger.exception(
                "[measure-watch] error fish_id={} svo={}: {}",
                fish_id,
                svo.name,
                e,
            )

        finally:
            # Always leave the shared status consistent, including when the
            # task is cancelled or another BaseException escapes.
            app_state.measure_status = "idle"

        # Reached on success and on handled failures alike; both count as
        # "processed". Cancellation skips this so the segment is retried.
        processed.add(key)
        if settings.measure_watch_use_state_file:
            add_watch_processed(settings, key, "measure")
|
||
|
||
|
||
async def _run_final_aggregate(
    svo_list: List[Path],
    fish_id: str,
    settings: Settings,
    processed: Set[str],
    state_file: Path,
    final_key: str,
) -> None:
    """Aggregate the segment snapshots of one fish folder into a final snapshot.

    Segment snapshots are reloaded in a worker thread and combined into an
    aggregate snapshot. When that is deliverable, preview media is generated
    on a best-effort basis and the snapshot is saved under the source path
    ``aggregate:{final_key}``. Failures are logged, not raised, and
    ``final_key`` is still marked as processed.

    Args:
        svo_list: Segment files of the folder; must not be empty.
        fish_id: Digit string taken from the ``fish{N}`` folder name.
        settings: Application settings.
        processed: In-memory set of processed keys; updated in place.
        state_file: Unused here; kept so the call signature stays stable.
        final_key: Processed-set key identifying this aggregate.
    """
    fish_folder = svo_list[0].parent.resolve()

    logger.info(
        "[measure-watch] final aggregate fish_id={} {} segment(s)",
        fish_id,
        len(svo_list),
    )

    def _reload():
        return measure_svc.reload_segment_snapshots_for_aggregate(
            svo_list, fish_id, settings
        )

    async with app_state.measure_lock:
        app_state.measure_status = "running"
        try:
            pairs = await to_thread(_reload)
            contributing_svos = [p[0] for p in pairs]
            segments = [p[1] for p in pairs]
            paths_joined = "|".join(sorted(str(p.resolve()) for p in contributing_svos))

            snap = measure_svc.build_measure_snapshot_aggregate(
                segments,
                fish_id,
                settings,
                contributing_svos=contributing_svos,
                fish_folder=str(fish_folder),
                segment_source_paths=paths_joined,
            )

            if measure_snapshot_deliverable(snap):
                try:
                    v_left, v_right = await to_thread(
                        measure_svc.generate_aggregate_preview_media,
                        contributing_svos,
                        snap,
                        fish_id,
                        settings,
                        final_key=final_key,
                    )
                    snap.video_left = v_left
                    snap.video_right = v_right
                except asyncio.CancelledError:
                    # Never downgrade cancellation to a preview failure
                    # (it is an Exception subclass before Python 3.8).
                    raise
                except Exception as e:
                    # Preview media is optional: the snapshot is saved
                    # without it when generation fails.
                    logger.warning(
                        "[measure-watch] final preview generate failed fish_id={}: {}",
                        fish_id,
                        e,
                    )
                save_measure_snapshot(
                    settings,
                    snap,
                    source_path=f"aggregate:{final_key}",
                    client_id=None,
                )
            else:
                logger.warning(
                    "[measure-watch] final not deliverable for fish_id={}, skip SQLite",
                    fish_id,
                )

            r0 = snap.result[0] if snap.result else {}
            logger.info(
                "[measure-watch] final done: fish_id={} weight={!r}",
                fish_id,
                r0.get("weight", ""),
            )

        except asyncio.CancelledError:
            # Let cancellation propagate without marking the aggregate as
            # processed, so it is retried after a restart.
            raise

        except Exception as e:
            logger.exception(
                "[measure-watch] final aggregate failed fish_id={}: {}",
                fish_id,
                e,
            )

        finally:
            # Always leave the shared status consistent, including when the
            # task is cancelled or another BaseException escapes.
            app_state.measure_status = "idle"

        # Reached on success and on handled failures alike.
        processed.add(final_key)
        if settings.measure_watch_use_state_file:
            add_watch_processed(settings, final_key, "measure")
|
||
|
||
|
||
async def watch_tick(
    settings: Settings,
    processed: Set[str],
    stability: Dict[str, Tuple[int, int]],
    final_stability: Dict[str, Tuple[Tuple[Tuple[str, int], ...], int]],
    state_file: Path,
) -> bool:
    """Run one polling pass over the watch directory.

    Each unprocessed segment is measured once its size has stayed unchanged
    for ``settings.measure_watch_stable_polls`` consecutive polls. When every
    segment of a fish folder is processed and the folder's size fingerprint
    has been stable for the same number of polls, the final aggregate is
    written.

    Args:
        settings: Application settings; ``measure_watch_dir`` must be set.
        processed: Keys of processed segments and finals; updated in place.
        stability: Per-segment ``(size, consecutive_polls)``; updated in place.
        final_stability: Per-folder ``(size_fingerprint, consecutive_polls)``;
            updated in place.
        state_file: Passed through to the measure/aggregate helpers.

    Returns:
        ``True`` if at least one measurement or aggregate ran in this pass.
    """
    assert settings.measure_watch_dir is not None
    watch_dir = settings.measure_watch_dir
    did = False
    seen_keys: Set[str] = set()
    seen_folders: Set[str] = set()

    for svo_list, fish_id in iter_svo2_folders(watch_dir):
        if not svo_list:
            continue

        fish_folder = svo_list[0].parent
        folder_key = str(fish_folder.resolve())
        seen_folders.add(folder_key)

        for svo in svo_list:
            key = str(svo.resolve())
            seen_keys.add(key)

            if key in processed:
                continue

            try:
                st = svo.stat()
            except OSError:
                continue

            size = int(st.st_size)
            if size <= 0:
                # Empty file: restart the count once it has content.
                stability.pop(key, None)
                continue

            last = stability.get(key)
            if last is None or last[0] != size:
                # First sighting or size changed: restart the count.
                stability[key] = (size, 1)
            else:
                _, cnt = last
                cnt += 1
                stability[key] = (size, cnt)
                if cnt >= settings.measure_watch_stable_polls:
                    await _run_single_svo_measure(
                        svo, fish_id, settings, processed, state_file
                    )
                    stability.pop(key, None)
                    did = True

        fk = _final_processed_key(fish_id, svo_list)
        if fk in processed:
            continue

        if not all(str(p.resolve()) in processed for p in svo_list):
            # Segments still pending: the final may not start counting yet.
            final_stability.pop(folder_key, None)
            continue

        tup = _folder_size_tuple(svo_list)
        if not tup:
            continue

        prev = final_stability.get(folder_key)
        if prev is None or prev[0] != tup:
            final_stability[folder_key] = (tup, 1)
        else:
            _, c = prev
            c += 1
            final_stability[folder_key] = (tup, c)
            if c >= settings.measure_watch_stable_polls:
                await _run_final_aggregate(
                    svo_list, fish_id, settings, processed, state_file, fk
                )
                final_stability.pop(folder_key, None)
                did = True

    # Forget counters of segments that are no longer present.
    for stale in [k for k in stability if k not in seen_keys]:
        del stability[stale]

    # Likewise for folders: otherwise entries of vanished folders pile up and
    # a stale count could be picked up again if the folder reappears.
    for stale in [k for k in final_stability if k not in seen_folders]:
        del final_stability[stale]

    return did
|
||
|
||
|
||
async def run_measure_watch_loop(settings: Settings) -> None:
    """Poll the measure watch directory forever, running ``watch_tick`` each round.

    Returns immediately, with a warning, when the configured watch path is
    not a directory. Otherwise the processed set is loaded (only when the
    state file is enabled) and the loop runs until the task is stopped from
    outside. It sleeps at least 0.1 s between rounds and hands the outcome
    of each round to ``maybe_warn_idle_watch``.
    """
    assert settings.measure_watch_dir is not None
    wd = settings.measure_watch_dir
    if not wd.is_dir():
        logger.warning("[measure-watch] skip: not a directory: {}", wd)
        return

    state_file = _state_path(settings)
    use_state = settings.measure_watch_use_state_file

    processed: Set[str]
    if use_state:
        processed = load_watch_processed(settings, state_file, "measure")
    else:
        processed = set()

    # Counters that persist across polling rounds.
    stability: Dict[str, Tuple[int, int]] = {}
    final_stability: Dict[str, Tuple[Tuple[Tuple[str, int], ...], int]] = {}

    state_label = "on" if use_state else "off"
    state_shown = state_file if use_state else ""
    logger.info(
        "[measure-watch] watching {} (poll={}s, stable_polls={}, aggregate={}, state={} {})",
        wd,
        settings.measure_watch_poll_interval,
        settings.measure_watch_stable_polls,
        settings.measure_final_aggregate_mode,
        state_label,
        state_shown,
    )

    idle_warn_state = IdleWatchWarnState()
    while True:
        worked = await watch_tick(
            settings, processed, stability, final_stability, state_file
        )
        maybe_warn_idle_watch(
            did_work=worked,
            log_tag="measure-watch",
            algo_name="FishMeasure",
            idle_hint="目录内无 fish{N} 子文件夹、已全部处理完毕,或文件尚未达到稳定轮询次数",
            watch_dir=wd,
            state=idle_warn_state,
            interval_sec=_MEASURE_IDLE_WARN_INTERVAL_SEC,
        )
        # Re-read the interval every round; never sleep less than 0.1 s.
        pause = max(settings.measure_watch_poll_interval, 0.1)
        await asyncio.sleep(pause)
|