fix(voice): queue split TTS segments after pause without replacing track

Detect consecutive tts_auto items on the same assistant bubble via listKey (uuid_seg_n / uuid_part_n). When paused, skip the 'clear queue and play latest only' path so later segments enqueue instead of wiping playback. Add regression test. Co-authored-by: Cursor <cursoragent@cursor.com>
2026-05-15 17:25:44 +08:00
parent 6452019a1e
commit ddc701f22d
2 changed files with 98 additions and 3 deletions
--- a/app-expo/src/features/voice/hooks/use-player.ts
+++ b/app-expo/src/features/voice/hooks/use-player.ts
@@ -5,6 +5,39 @@ import { audioFocus } from '@/core/audio/audio-focus';
 import type { PlaybackItem, PlayerStatus } from '../types';
 /**
 * `handleTtsSegment` 使用 `assistantSegmentMessageId` → `{uuid}_seg_{n}`；
 * 展平气泡使用 `{uuid}_part_{n}`。同一条落库助手消息上的连续分段应用入队续播，
 * 而不是「暂停后又到一条 tts_auto 就整轨切换成最新」——否则多段朗读只会听到最后一段。
 */
 function parseAssistantSplitListKey(listKey: string | undefined): {
  messageId: string;
  segmentIndex: number;
 } | null {
  if (!listKey) return null;
  const m =
    /^([0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12})_(?:seg|part)_(\d+)$/i.exec(
      listKey,
    );
  if (!m) return null;
  return { messageId: m[1]!, segmentIndex: Number(m[2]) };
 }
 function isLaterSegmentOfSameAssistantBubble(
  current: PlaybackItem | null | undefined,
  incoming: PlaybackItem,
 ): boolean {
  if (incoming.kind !== 'tts_auto' || current?.kind !== 'tts_auto') {
    return false;
  }
  const a = parseAssistantSplitListKey(current.messageRef?.listKey);
  const b = parseAssistantSplitListKey(incoming.messageRef?.listKey);
  if (!a || !b) return false;
  return (
    a.messageId === b.messageId && b.segmentIndex > a.segmentIndex
  );
 }
 interface UsePlayerResult {
  status: PlayerStatus;
  queueLength: number;
@@ -40,6 +73,8 @@ export function usePlayer(): UsePlayerResult {
  const isPlayingRef = useRef(false);
  const wasBlockedByRecorderRef = useRef(false);
  const isPlayNextInProgressRef = useRef(false);
  /** 供 `enqueue` 判断「同一条助手消息的下一段 TTS」；不依赖 React state 闭包陈旧。 */
  const currentPlaybackItemRef = useRef<PlaybackItem | null>(null);
  /** 与 `status` 同步；`pausePlayback` 等在同一事件循环内立即更新，避免 WS 紧跟着 `enqueue(tts_auto)` 时读到陈旧 `playing`。 */
  const statusRef = useRef<PlayerStatus>('idle');
  /** 同步反映「当前是否正在播放某条 URI」；enqueue 不能依赖 state，否则 await stop() 后仍为陈旧闭包。 */
@@ -69,6 +104,10 @@ export function usePlayer(): UsePlayerResult {
    statusRef.current = status;
  }, [status]);
  useEffect(() => {
    currentPlaybackItemRef.current = currentPlaybackItem;
  }, [currentPlaybackItem]);
  /**
   * 必须在 `isLoaded` 之后再 `play()`。
   * expo-audio 在 `downloadFirst: true` 时先用 null 建 player，再在内部 effect 里异步
@@ -206,10 +245,23 @@ export function usePlayer(): UsePlayerResult {
    async (item: PlaybackItem) => {
      /**
       * 用户在助手自动朗读中途点暂停时，`playbackActiveUriRef` 仍指向当前条，
-       * 后续 `tts_auto` 只会堆在队列里且不会 `playNext`。
+       * 后续 `tts_auto` 默认堆在队列里且不会 `playNext`。
-       * 新片段到达时表示「最新已生成」：清掉暂停态与积压队列，只播本条。
+       * 无分段 listKey 时：新片段到达表示「另一条 / 最新一条」应只播它 → 清暂停态与队列。
       * 有 `{uuid}_seg_{n}` 且 n 递增：同一落库助手消息的多段 TTS → 只入队，不抢轨。
       */
-      if (item.kind === 'tts_auto' && statusRef.current === 'paused') {
+      const skipPausedClearForSplitContinue =
        item.kind === 'tts_auto' &&
        statusRef.current === 'paused' &&
        isLaterSegmentOfSameAssistantBubble(
          currentPlaybackItemRef.current,
          item,
        );
      if (
        item.kind === 'tts_auto' &&
        statusRef.current === 'paused' &&
        !skipPausedClearForSplitContinue
      ) {
        queueRef.current = [];
        setQueueLength(0);
        isPlayingRef.current = false;
--- a/app-expo/tests/features/voice/use-player.test.tsx
+++ b/app-expo/tests/features/voice/use-player.test.tsx
@@ -207,4 +207,47 @@ describe('usePlayer', () => {
    expect(play.mock.calls.length).toBeGreaterThan(playCountAfterFirst);
    expect(result.current.currentSource).toBe('file:///latest.mp3');
  });
  test('after pause, next uuid_seg tts_auto queues without replacing current (multi-segment TTS)', async () => {
    const aid = '78b32c06-d2f9-453b-9cc4-354e68fbcb2d';
    mockUseAudioPlayerStatus.mockReturnValue({
      isLoaded: true,
      playing: false,
      currentTime: 0.1,
      duration: 10,
    });
    const pause = jest.fn();
    const play = jest.fn();
    mockUseAudioPlayer.mockReturnValue({ pause, play });
    const { result } = renderHook(() => usePlayer());
    await act(async () => {
      await result.current.enqueue({
        uri: 'file:///seg0.mp3',
        kind: 'tts_auto',
        messageRef: { listKey: `${aid}_seg_0` },
      });
    });
    expect(result.current.status).toBe('playing');
    expect(result.current.currentSource).toBe('file:///seg0.mp3');
    act(() => {
      result.current.pausePlayback();
    });
    expect(result.current.status).toBe('paused');
    await act(async () => {
      await result.current.enqueue({
        uri: 'file:///seg1.mp3',
        kind: 'tts_auto',
        messageRef: { listKey: `${aid}_seg_1` },
      });
    });
    expect(result.current.status).toBe('paused');
    expect(result.current.currentSource).toBe('file:///seg0.mp3');
    expect(result.current.queueLength).toBe(1);
  });
 });