/**
 * Multi-Turn Tool Call Test (Streaming)
 *
 * Simulates Claude Code's streaming multi-turn conversation pattern.
 * Same flow as non-streaming but verifies:
 * - SSE events are properly formatted
 * - signature_delta events are present
 * - Thinking blocks accumulate correctly across deltas
 */
const http = require('http');

const BASE_URL = 'localhost';
const PORT = 8080;

/**
 * Splits a raw SSE response body into `{ type, data }` events.
 *
 * Frames are separated by a blank line (LF or CRLF). A frame is kept only
 * when it has both an `event:` and a `data:` line and the data is valid JSON.
 *
 * @param {string} raw - Complete response body.
 * @returns {Array<{type: string, data: *}>} Parsed events in stream order.
 */
function parseSseEvents(raw) {
  const events = [];
  const frames = raw.split(/\r?\n\r?\n/).filter(frame => frame.trim());

  for (const frame of frames) {
    const lines = frame.split(/\r?\n/);
    const eventLine = lines.find(line => line.startsWith('event:'));
    const dataLine = lines.find(line => line.startsWith('data:'));
    if (!eventLine || !dataLine) continue;

    const type = eventLine.slice('event:'.length).trim();
    try {
      const data = JSON.parse(dataLine.slice('data:'.length).trim());
      events.push({ type, data });
    } catch (err) {
      // Best effort: one malformed frame must not abort the whole run,
      // but it should not disappear silently either.
      console.warn(`Skipping SSE "${type}" frame with unparsable data: ${err.message}`);
    }
  }

  return events;
}

/**
 * Rebuilds the message content blocks from content_block_* events.
 *
 * Thinking text, signature, text and tool input JSON are accumulated from
 * their deltas; a block is emitted when its content_block_stop arrives.
 *
 * @param {Array<{type: string, data: *}>} events - Events from parseSseEvents.
 * @returns {Array<object>} Completed content blocks in stream order.
 */
function buildContent(events) {
  const content = [];
  let currentBlock = null;

  for (const event of events) {
    if (event.type === 'content_block_start') {
      currentBlock = { ...event.data.content_block };
      if (currentBlock.type === 'thinking') {
        currentBlock.thinking = '';
        currentBlock.signature = '';
      }
      if (currentBlock.type === 'text') currentBlock.text = '';
    } else if (event.type === 'content_block_delta') {
      const delta = event.data?.delta;
      // A delta without an open block (or without a payload) has nowhere to go.
      if (!currentBlock || !delta) continue;

      if (delta.type === 'thinking_delta') {
        currentBlock.thinking += delta.thinking || '';
      } else if (delta.type === 'signature_delta') {
        currentBlock.signature += delta.signature || '';
      } else if (delta.type === 'text_delta') {
        currentBlock.text += delta.text || '';
      } else if (delta.type === 'input_json_delta') {
        currentBlock.partial_json = (currentBlock.partial_json || '') + (delta.partial_json || '');
      }
    } else if (event.type === 'content_block_stop') {
      if (currentBlock?.type === 'tool_use') {
        const json = currentBlock.partial_json;
        // Always strip the scratch field, even when it is an empty string;
        // otherwise it would be echoed back to the server inside the
        // assistant message of the next turn.
        delete currentBlock.partial_json;
        if (json) {
          try {
            currentBlock.input = JSON.parse(json);
          } catch (err) {
            console.warn(`Could not parse tool input JSON: ${err.message}`);
          }
        }
      }
      if (currentBlock) content.push(currentBlock);
      currentBlock = null;
    }
  }

  return content;
}

/**
 * Determines whether the response represents a failure.
 *
 * @param {Array<{type: string, data: *}>} events - Parsed SSE events.
 * @param {number} statusCode - HTTP status code of the response.
 * @param {string} raw - Complete response body.
 * @returns {object|null} An object with at least the error details the server
 *   sent (or a synthesized `message`), or null when no failure was detected.
 */
function extractError(events, statusCode, raw) {
  const errorEvent = events.find(e => e.type === 'error');
  if (errorEvent) {
    return errorEvent.data?.error ?? { message: 'Stream contained an error event without details' };
  }

  if (statusCode >= 400) {
    let body = null;
    try {
      body = JSON.parse(raw);
    } catch {
      // Body is not JSON; fall through and report the raw text instead.
    }
    const detail = body?.error;
    if (detail && typeof detail === 'object') return detail;
    const summary = typeof detail === 'string' ? detail : raw.trim().slice(0, 200);
    return { message: `HTTP ${statusCode}: ${summary}` };
  }

  return null;
}

/**
 * POSTs `body` to /v1/messages on BASE_URL:PORT and collects the SSE response.
 *
 * @param {object} body - JSON-serializable request payload.
 * @returns {Promise<{content: Array<object>, events: Array<object>, error?: object, statusCode: number, raw: string}>}
 *   Resolves once the response ends; `error` is present only on failure.
 *   Rejects on request/response transport errors.
 */
function streamRequest(body) {
  return new Promise((resolve, reject) => {
    const data = JSON.stringify(body);
    const req = http.request({
      host: BASE_URL,
      port: PORT,
      path: '/v1/messages',
      method: 'POST',
      headers: {
        'Content-Type': 'application/json',
        'x-api-key': 'test',
        'anthropic-version': '2023-06-01',
        'anthropic-beta': 'interleaved-thinking-2025-05-14',
        'Content-Length': Buffer.byteLength(data)
      }
    }, res => {
      // Decode as a stream so multi-byte characters split across chunks survive.
      res.setEncoding('utf8');
      let fullData = '';

      res.on('data', chunk => {
        fullData += chunk;
      });
      res.on('error', reject);
      res.on('end', () => {
        try {
          const events = parseSseEvents(fullData);
          const content = buildContent(events);
          const error = extractError(events, res.statusCode, fullData);

          if (error) {
            resolve({ content, events, error, statusCode: res.statusCode, raw: fullData });
          } else {
            resolve({ content, events, statusCode: res.statusCode, raw: fullData });
          }
        } catch (err) {
          // Surface unexpected event shapes as a rejection instead of an
          // uncaught exception inside the stream callback.
          reject(err);
        }
      });
    });

    req.on('error', reject);
    req.write(data);
    req.end();
  });
}

const tools = [{
  name: 'execute_command',
  description: 'Execute a shell command',
  input_schema: {
    type: 'object',
    properties: {
      command: { type: 'string', description: 'Command to execute' },
      cwd: { type: 'string', description: 'Working directory' }
    },
    required: ['command']
  }
}];

/**
 * Groups content blocks by type and derives the flags the test asserts on.
 *
 * @param {Array<object>} content - Content blocks from streamRequest.
 * @returns {{thinking: Array, toolUse: Array, text: Array, hasThinking: boolean,
 *   hasToolUse: boolean, hasText: boolean, thinkingHasSignature: boolean}}
 *   `thinkingHasSignature` is true when any thinking block carries a
 *   signature of at least 50 characters.
 */
function analyzeContent(content) {
  const thinking = content.filter(b => b.type === 'thinking');
  const toolUse = content.filter(b => b.type === 'tool_use');
  const text = content.filter(b => b.type === 'text');

  return {
    thinking,
    toolUse,
    text,
    hasThinking: thinking.length > 0,
    hasToolUse: toolUse.length > 0,
    hasText: text.length > 0,
    thinkingHasSignature: thinking.some(t => t.signature && t.signature.length >= 50)
  };
}

/**
 * Counts SSE events by event type and by delta type.
 *
 * @param {Array<{type: string, data: *}>} events - Events from streamRequest.
 * @returns {object} Counters keyed by messageStart, blockStart, blockDelta,
 *   blockStop, messageDelta, messageStop, thinkingDeltas, signatureDeltas,
 *   textDeltas and inputJsonDeltas.
 */
function analyzeEvents(events) {
  const countEvents = type => events.filter(e => e.type === type).length;
  const countDeltas = type => events.filter(e => e.data?.delta?.type === type).length;

  return {
    messageStart: countEvents('message_start'),
    blockStart: countEvents('content_block_start'),
    blockDelta: countEvents('content_block_delta'),
    blockStop: countEvents('content_block_stop'),
    messageDelta: countEvents('message_delta'),
    messageStop: countEvents('message_stop'),
    thinkingDeltas: countDeltas('thinking_delta'),
    signatureDeltas: countDeltas('signature_delta'),
    textDeltas: countDeltas('text_delta'),
    inputJsonDeltas: countDeltas('input_json_delta')
  };
}

/**
 * Builds the request payload shared by both turns.
 *
 * @param {Array<object>} messages - Conversation so far.
 * @returns {object} Payload for streamRequest.
 */
function createRequestBody(messages) {
  return {
    model: 'claude-sonnet-4-5-thinking',
    max_tokens: 4096,
    stream: true,
    tools,
    thinking: { type: 'enabled', budget_tokens: 10000 },
    messages
  };
}

// Simulated `ls -la` output returned as the tool result in turn 2.
const LS_OUTPUT = [
  'total 32',
  'drwxr-xr-x 10 user staff 320 Dec 19 10:00 .',
  'drwxr-xr-x 5 user staff 160 Dec 19 09:00 ..',
  '-rw-r--r-- 1 user staff 1024 Dec 19 10:00 package.json',
  '-rw-r--r-- 1 user staff 2048 Dec 19 10:00 README.md',
  'drwxr-xr-x 8 user staff 256 Dec 19 10:00 src',
  'drwxr-xr-x 4 user staff 128 Dec 19 10:00 tests'
].join('\n');

/**
 * Runs the two-turn streaming scenario, prints a report and exits the
 * process with code 0 when every check passed, 1 otherwise.
 *
 * Turn 1 expects thinking (with signature) plus a tool call; turn 2 feeds a
 * tool result back and expects thinking plus a text answer. Turn 2 only runs
 * when turn 1 produced a tool call.
 *
 * @returns {Promise<void>} Never resolves in practice: the process exits first.
 */
async function runTests() {
  console.log('='.repeat(60));
  console.log('MULTI-TURN TOOL CALL TEST (STREAMING)');
  console.log('Simulates Claude Code streaming conversation');
  console.log('='.repeat(60));
  console.log('');

  const messages = [];
  let allPassed = true;
  const results = [];

  // ===== TURN 1: Initial request =====
  console.log('TURN 1: User asks to run a command');
  console.log('-'.repeat(40));

  messages.push({
    role: 'user',
    content: 'Run "ls -la" in the current directory and tell me what files exist.'
  });

  const turn1 = await streamRequest(createRequestBody(messages));

  if (turn1.error) {
    console.log(` ERROR: ${turn1.error.message}`);
    allPassed = false;
    results.push({ name: 'Turn 1: Streaming request', passed: false });
  } else {
    const content = analyzeContent(turn1.content);
    const events = analyzeEvents(turn1.events);

    console.log(' Content:');
    console.log(` Thinking: ${content.hasThinking ? 'YES' : 'NO'} (${content.thinking.length} blocks)`);
    console.log(` Signature: ${content.thinkingHasSignature ? 'YES' : 'NO'}`);
    console.log(` Tool Use: ${content.hasToolUse ? 'YES' : 'NO'} (${content.toolUse.length} calls)`);
    console.log(' Events:');
    console.log(` message_start: ${events.messageStart}`);
    console.log(` content_block_start/stop: ${events.blockStart}/${events.blockStop}`);
    console.log(` thinking_delta: ${events.thinkingDeltas}`);
    console.log(` signature_delta: ${events.signatureDeltas}`);
    console.log(` input_json_delta: ${events.inputJsonDeltas}`);

    if (content.hasThinking && content.thinking[0].thinking) {
      console.log(` Thinking: "${content.thinking[0].thinking.substring(0, 60)}..."`);
    }
    if (content.hasToolUse) {
      console.log(` Tool: ${content.toolUse[0].name}(${JSON.stringify(content.toolUse[0].input)})`);
    }

    const passed = content.hasThinking &&
      content.thinkingHasSignature &&
      events.signatureDeltas > 0 &&
      content.hasToolUse;
    results.push({ name: 'Turn 1: Thinking + Signature + Tool Use + Events', passed });
    if (!passed) allPassed = false;

    // Only continue the conversation when there is a tool call to answer.
    if (content.hasToolUse) {
      messages.push({ role: 'assistant', content: turn1.content });
    }
  }

  // ===== TURN 2: Provide tool result =====
  if (messages.length >= 2) {
    console.log('\nTURN 2: Provide command output, expect summary');
    console.log('-'.repeat(40));

    const lastAssistant = messages[messages.length - 1];
    const toolUseBlock = lastAssistant.content.find(b => b.type === 'tool_use');

    messages.push({
      role: 'user',
      content: [{
        type: 'tool_result',
        tool_use_id: toolUseBlock.id,
        content: LS_OUTPUT
      }]
    });

    const turn2 = await streamRequest(createRequestBody(messages));

    if (turn2.error) {
      console.log(` ERROR: ${turn2.error.message}`);
      allPassed = false;
      results.push({ name: 'Turn 2: After tool result', passed: false });
    } else {
      const content = analyzeContent(turn2.content);
      const events = analyzeEvents(turn2.events);

      console.log(' Content:');
      console.log(` Thinking: ${content.hasThinking ? 'YES' : 'NO'} (${content.thinking.length} blocks)`);
      console.log(` Signature: ${content.thinkingHasSignature ? 'YES' : 'NO'}`);
      console.log(` Text: ${content.hasText ? 'YES' : 'NO'}`);
      console.log(' Events:');
      console.log(` thinking_delta: ${events.thinkingDeltas}`);
      console.log(` signature_delta: ${events.signatureDeltas}`);
      console.log(` text_delta: ${events.textDeltas}`);

      if (content.hasText && content.text[0].text) {
        console.log(` Response: "${content.text[0].text.substring(0, 100)}..."`);
      }

      const passed = content.hasThinking && content.hasText && events.textDeltas > 0;
      results.push({ name: 'Turn 2: Thinking + Text response', passed });
      if (!passed) allPassed = false;
    }
  }

  // ===== Summary =====
  console.log('\n' + '='.repeat(60));
  console.log('SUMMARY');
  console.log('='.repeat(60));

  for (const result of results) {
    const status = result.passed ? 'PASS' : 'FAIL';
    console.log(` [${status}] ${result.name}`);
  }

  console.log('\n' + '='.repeat(60));
  console.log(`OVERALL: ${allPassed ? 'ALL TESTS PASSED' : 'SOME TESTS FAILED'}`);
  console.log('='.repeat(60));

  process.exit(allPassed ? 0 : 1);
}

runTests().catch(err => {
  console.error('Test failed with error:', err);
  process.exit(1);
});