feat(vela): start mocked response flow after push-to-talk commit

This commit is contained in:
2026-04-08 21:20:17 +02:00
parent 98bcc543f5
commit 28712443cc
8 changed files with 284 additions and 25 deletions

View File

@@ -105,6 +105,7 @@ test('voice session shell supports a placeholder mic-control cycle before anothe
await expect(page.getByTestId('user-transcript')).toHaveText(
'[mocked final] Placeholder push-to-talk transcript completed from 1 appended chunk.'
);
await expect(page.getByTestId('assistant-response')).toHaveText(MOCKED_ASSISTANT_RESPONSE);
await expect(page.getByTestId('partial-transcript')).toHaveText('none');
await expect(page.getByTestId('gateway-session-state')).toHaveText('idle');
await expect(page.getByTestId('mocked-turn-button')).toBeEnabled();
@@ -114,3 +115,34 @@ test('voice session shell supports a placeholder mic-control cycle before anothe
await expect(page.getByTestId('assistant-response')).toHaveText(MOCKED_ASSISTANT_RESPONSE);
await expect(page.getByTestId('mocked-turn-status')).toHaveText('idle');
});
// End-to-end check: a push-to-talk turn can be cancelled while the mocked
// assistant response is on screen, the already-rendered transcript and
// assistant text stay visible, and a follow-up mocked turn still completes.
test('voice session shell can cancel a push-to-talk mocked response and start another turn', async ({ page }) => {
  const FINAL_TRANSCRIPT =
    '[mocked final] Placeholder push-to-talk transcript completed from 1 appended chunk.';
  const ASSISTANT_PREFIX = '[mocked assistant]';

  // Builds a fresh locator on every call, exactly like an inline getByTestId.
  const byId = (testId) => page.getByTestId(testId);

  // Load the page and connect.
  await page.goto('/');
  await expect(byId('hydration-status')).toHaveText('ready');
  await byId('connect-button').click();
  await expect(byId('connection-state')).toHaveText('connected');

  // Press and release the mic control via raw mouse events.
  await byId('mic-control-button').dispatchEvent('mousedown');
  await expect(byId('gateway-session-state')).toHaveText('listening');
  await byId('mic-control-button').dispatchEvent('mouseup');
  await expect(byId('user-transcript')).toHaveText(FINAL_TRANSCRIPT);

  // Cancel once the cancel button is enabled and assistant text is showing.
  await expect(byId('cancel-turn-button')).toBeEnabled();
  await expect(byId('assistant-response')).toContainText(ASSISTANT_PREFIX);
  await byId('cancel-turn-button').click();

  // Session returns to idle; previously rendered text must still be present.
  await expect(byId('gateway-session-state')).toHaveText('idle');
  await expect(byId('mocked-turn-status')).toHaveText('idle');
  await expect(byId('user-transcript')).toHaveText(FINAL_TRANSCRIPT);
  await expect(byId('assistant-response')).toContainText(ASSISTANT_PREFIX);

  // A new mocked turn can be triggered and runs to completion.
  await expect(byId('mocked-turn-button')).toBeEnabled();
  await byId('mocked-turn-button').click();
  await expect(byId('assistant-response')).toHaveText(MOCKED_ASSISTANT_RESPONSE);
  await expect(byId('mocked-turn-status')).toHaveText('idle');
});

View File

@@ -53,6 +53,7 @@
let inProgressPartialTranscript = 'none';
let mockedAssistantResponse = 'none';
let mockedTurnInFlight = false;
let assistantResponseExpected = false;
let mockedConversationRenderOrder = [];
let micControlActive = false;
let hydrationStatus = 'mounting';
@@ -78,6 +79,7 @@
connectionState === 'connected' &&
socket?.readyState === WebSocket.OPEN &&
sessionReadyReceived &&
gatewaySessionState === 'idle' &&
!mockedTurnInFlight;
function clearSocketHandlers(targetSocket) {
@@ -96,6 +98,7 @@
inProgressPartialTranscript = 'none';
mockedAssistantResponse = 'none';
mockedTurnInFlight = false;
assistantResponseExpected = false;
mockedConversationRenderOrder = [];
micControlActive = false;
}
@@ -125,6 +128,7 @@
}
connectionDetail = 'Mic control shell released. Sending placeholder input_audio.commit.';
assistantResponseExpected = true;
socket.send(JSON.stringify(createMessageEnvelope('input_audio.commit', {})));
}
@@ -150,6 +154,7 @@
inProgressPartialTranscript = 'none';
mockedAssistantResponse = 'waiting for mocked response…';
mockedTurnInFlight = true;
assistantResponseExpected = true;
lastError = 'none';
socket.send(JSON.stringify(createMessageEnvelope('mocked.turn.trigger', {})));
}
@@ -235,6 +240,7 @@
gatewaySessionState = message.payload.value;
if (message.payload.value === 'idle') {
mockedTurnInFlight = false;
assistantResponseExpected = false;
}
return;
}
@@ -242,7 +248,8 @@
if (message.type === 'transcript.final') {
inProgressPartialTranscript = 'none';
mockedUserTranscript = message.payload.text;
if (mockedTurnInFlight) {
if (assistantResponseExpected) {
mockedTurnInFlight = true;
mockedAssistantResponse = '…';
}
if (!mockedConversationRenderOrder.includes('transcript')) {
@@ -276,12 +283,14 @@
if (message.type === 'response.completed') {
mockedTurnInFlight = false;
assistantResponseExpected = false;
return;
}
if (message.type === 'error') {
if (message.payload.retryable === false) {
mockedTurnInFlight = false;
assistantResponseExpected = false;
connectionState = 'error';
connectionDetail = 'Gateway reported a protocol error.';
} else {

View File

@@ -93,7 +93,7 @@ describe('voice session shell', () => {
});
});
it('runs a placeholder mic-control cycle and keeps mocked turn usable on the same socket', async () => {
it('runs a placeholder mic-control cycle, streams mocked assistant text, and keeps mocked turn usable on the same socket', async () => {
render(VoiceSessionShell);
await fireEvent.click(getByTestId('connect-button'));
@@ -154,6 +154,15 @@ describe('voice session shell', () => {
text: '[mocked final] Placeholder push-to-talk transcript completed from 1 appended chunk.'
})
);
socket.message(createMessageEnvelope('session.state', { value: 'thinking' }));
socket.message(createMessageEnvelope('session.state', { value: 'speaking' }));
socket.message(createMessageEnvelope('response.text.delta', { text: '[mocked assistant] ' }));
socket.message(
createMessageEnvelope('response.text.delta', {
text: 'This is a deterministic mocked response from the gateway vertical slice.'
})
);
socket.message(createMessageEnvelope('response.completed', {}));
socket.message(createMessageEnvelope('session.state', { value: 'idle' }));
@@ -163,6 +172,9 @@ describe('voice session shell', () => {
expect(getByTestId('user-transcript').textContent).toBe(
'[mocked final] Placeholder push-to-talk transcript completed from 1 appended chunk.'
);
expect(getByTestId('assistant-response').textContent).toBe(
'[mocked assistant] This is a deterministic mocked response from the gateway vertical slice.'
);
expect(getByTestId('partial-transcript').textContent).toBe('none');
});
@@ -172,6 +184,61 @@ describe('voice session shell', () => {
expect(JSON.parse(socket.sent[2]).type).toBe('mocked.turn.trigger');
});
// Unit check: cancelling a push-to-talk turn after the first assistant delta
// leaves the final transcript and the partial assistant text rendered, and
// re-enables the mic control once the gateway reports idle.
it('keeps rendered push-to-talk transcript and assistant text visible after cancel', async () => {
  const FINAL_TRANSCRIPT =
    '[mocked final] Placeholder push-to-talk transcript completed from 1 appended chunk.';
  const FIRST_DELTA = '[mocked assistant] ';

  // Each helper queries the DOM at call time, same as an inline getByTestId.
  const isDisabled = (testId) => getByTestId(testId).hasAttribute('disabled');
  const textOf = (testId) => getByTestId(testId).textContent;

  render(VoiceSessionShell);
  await fireEvent.click(getByTestId('connect-button'));

  const socket = MockWebSocket.latest();
  const emit = (type, payload) => socket.message(createMessageEnvelope(type, payload));
  const sentTypeAt = (index) => JSON.parse(socket.sent[index]).type;

  // Bring the mocked session up to a ready, idle state.
  socket.open();
  emit('session.ready', { sessionId: 'session-ptt-cancel' });
  emit('session.state', { value: 'idle' });
  await waitFor(() => {
    expect(isDisabled('mic-control-button')).toBe(false);
  });

  // Hold the mic control while the gateway reports listening and a partial.
  await fireEvent.mouseDown(getByTestId('mic-control-button'));
  emit('session.state', { value: 'listening' });
  emit('transcript.partial', {
    text: '[mocked partial] Placeholder push-to-talk transcript in progress.'
  });

  // Releasing the control must send the commit message at index 1.
  await fireEvent.mouseUp(getByTestId('mic-control-button'));
  expect(sentTypeAt(1)).toBe('input_audio.commit');

  // Gateway finalizes the transcript and delivers only the first text delta.
  emit('transcript.final', { text: FINAL_TRANSCRIPT });
  emit('session.state', { value: 'thinking' });
  emit('session.state', { value: 'speaking' });
  emit('response.text.delta', { text: FIRST_DELTA });
  await waitFor(() => {
    expect(isDisabled('cancel-turn-button')).toBe(false);
    expect(textOf('assistant-response')).toBe(FIRST_DELTA);
  });

  // Cancel mid-response; the cancel message is expected at index 2.
  await fireEvent.click(getByTestId('cancel-turn-button'));
  expect(sentTypeAt(2)).toBe('response.cancel');
  emit('session.state', { value: 'idle' });

  // After idle: statuses reset, rendered text is retained, mic is usable.
  await waitFor(() => {
    expect(textOf('gateway-session-state')).toBe('idle');
    expect(textOf('mocked-turn-status')).toBe('idle');
    expect(isDisabled('cancel-turn-button')).toBe(true);
    expect(textOf('user-transcript')).toBe(FINAL_TRANSCRIPT);
    expect(textOf('assistant-response')).toBe(FIRST_DELTA);
    expect(isDisabled('mic-control-button')).toBe(false);
  });
});
it('renders mocked transcript before assistant response for a connected session', async () => {
render(VoiceSessionShell);