CodebuffAI
diff --git a/‎.github/workflows/ci.yml‎
Lines changed: 2 additions & 2 deletions b/‎.github/workflows/ci.yml‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎backend/src/__tests__/subagent-streaming.test.ts‎
Lines changed: 247 additions & 0 deletions b/‎backend/src/__tests__/subagent-streaming.test.ts‎
Lines changed: 247 additions & 0 deletions
diff --git a/‎backend/src/tools/handlers/spawn-agents-async.ts‎
Lines changed: 18 additions & 3 deletions b/‎backend/src/tools/handlers/spawn-agents-async.ts‎
Lines changed: 18 additions & 3 deletions
@@ -120,7 +120,7 @@ jobs:
         with:
           timeout_minutes: 10
           max_attempts: 5
-          command: cd ${{ matrix.package }} && bun test $(find src -name '*.test.ts' ! -name '*.integration.test.ts')
+          command: cd ${{ matrix.package }} && find src -name '*.test.ts' ! -name '*.integration.test.ts' | sort | xargs -I {} bun test {}
 
       # - name: Open interactive debug shell
       #   if: ${{ failure() }}
@@ -180,7 +180,7 @@ jobs:
         with:
           timeout_minutes: 15
           max_attempts: 3
-          command: cd ${{ matrix.package }} && bun test $(find src -name '*.integration.test.ts')
+          command: cd ${{ matrix.package }} && find src -name '*.integration.test.ts' | sort | xargs -I {} bun test {}
 
       # - name: Open interactive debug shell
       #   if: ${{ failure() }}
 
@@ -0,0 +1,247 @@
+import { TEST_USER_ID } from '@codebuff/common/constants'
+import { getInitialSessionState } from '@codebuff/common/types/session-state'
+import {
+  afterAll,
+  beforeAll,
+  beforeEach,
+  describe,
+  expect,
+  it,
+  Mock,
+  mock,
+  spyOn,
+} from 'bun:test'
+import { WebSocket } from 'ws'
+
+import * as runAgentStep from '../run-agent-step'
+import * as agentRegistryModule from '../templates/agent-registry'
+import { AgentTemplate } from '../templates/types'
+import {
+  handleSpawnAgents,
+  SendSubagentChunk,
+} from '../tools/handlers/spawn-agents'
+import * as loggerModule from '../util/logger'
+import { mockFileContext, MockWebSocket } from './test-utils'
+
+describe('Subagent Streaming', () => {
+  let mockSendSubagentChunk: Mock<SendSubagentChunk>
+  let mockLoopAgentSteps: Mock<(typeof runAgentStep)['loopAgentSteps']>
+
+  beforeAll(() => {
+    // Mock dependencies
+    spyOn(loggerModule.logger, 'debug').mockImplementation(() => {})
+    spyOn(loggerModule.logger, 'error').mockImplementation(() => {})
+    spyOn(loggerModule.logger, 'info').mockImplementation(() => {})
+    spyOn(loggerModule.logger, 'warn').mockImplementation(() => {})
+    spyOn(loggerModule, 'withLoggerContext').mockImplementation(
+      async (context: any, fn: () => Promise<any>) => fn()
+    )
+
+    // Mock sendSubagentChunk function to capture streaming messages
+    mockSendSubagentChunk = mock(
+      (data: {
+        userInputId: string
+        agentId: string
+        agentType: string
+        chunk: string
+        prompt?: string
+      }) => {}
+    )
+
+    // Mock loopAgentSteps to simulate subagent execution with streaming
+    mockLoopAgentSteps = spyOn(
+      runAgentStep,
+      'loopAgentSteps'
+    ).mockImplementation(async (ws, options) => {
+      // Simulate streaming chunks by calling the callback
+      if (options.onResponseChunk) {
+        options.onResponseChunk('Thinking about the problem...')
+        options.onResponseChunk('Found a solution!')
+      }
+
+      return {
+        agentState: {
+          ...options.agentState,
+          messageHistory: [
+            { role: 'assistant', content: 'Test response from subagent' },
+          ],
+        },
+      }
+    })
+
+    // Mock agent registry
+    spyOn(agentRegistryModule.agentRegistry, 'initialize').mockImplementation(
+      async () => {}
+    )
+    spyOn(
+      agentRegistryModule.agentRegistry,
+      'getAllTemplates'
+    ).mockImplementation(() => ({
+      thinker: {
+        id: 'thinker',
+        name: 'Thinker',
+        outputMode: 'last_message',
+        promptSchema: {
+          prompt: {
+            safeParse: () => ({ success: true }),
+          } as any,
+        },
+        purpose: '',
+        model: '',
+        includeMessageHistory: true,
+        toolNames: [],
+        spawnableAgents: [],
+        initialAssistantMessage: '',
+        initialAssistantPrefix: '',
+        stepAssistantMessage: '',
+        stepAssistantPrefix: '',
+        systemPrompt: '',
+        userInputPrompt: '',
+        agentStepPrompt: '',
+      },
+    }))
+    spyOn(agentRegistryModule.agentRegistry, 'getAgentName').mockImplementation(
+      () => 'Thinker'
+    )
+  })
+
+  beforeEach(() => {
+    mockSendSubagentChunk.mockClear()
+    mockLoopAgentSteps.mockClear()
+  })
+
+  afterAll(() => {
+    mock.restore()
+  })
+
+  it('should send subagent-response-chunk messages during agent execution', async () => {
+    const ws = new MockWebSocket() as unknown as WebSocket
+    const sessionState = getInitialSessionState(mockFileContext)
+    const agentState = sessionState.mainAgentState
+
+    // Mock parent agent template that can spawn thinker
+    const parentTemplate = {
+      id: 'base',
+      spawnableAgents: ['thinker'],
+    } as unknown as AgentTemplate
+
+    const toolCall = {
+      toolName: 'spawn_agents' as const,
+      toolCallId: 'test-tool-call-id',
+      args: {
+        agents: [
+          {
+            agent_type: 'thinker',
+            prompt: 'Think about this problem',
+          },
+        ],
+      },
+    }
+
+    const { result } = handleSpawnAgents({
+      previousToolCallFinished: Promise.resolve(),
+      toolCall,
+      fileContext: mockFileContext,
+      clientSessionId: 'test-session',
+      userInputId: 'test-input',
+      getLatestState: () => ({ messages: [] }),
+      state: {
+        ws,
+        fingerprintId: 'test-fingerprint',
+        userId: TEST_USER_ID,
+        agentTemplate: parentTemplate,
+        sendSubagentChunk: mockSendSubagentChunk,
+        messages: [],
+        agentState,
+      },
+    })
+
+    await result
+
+    // Verify that subagent streaming messages were sent
+    expect(mockSendSubagentChunk).toHaveBeenCalledTimes(2)
+
+    // Check first streaming chunk
+    expect(mockSendSubagentChunk).toHaveBeenNthCalledWith(1, {
+      userInputId: 'test-input',
+      agentId: expect.any(String),
+      agentType: 'thinker',
+      chunk: 'Thinking about the problem...',
+      prompt: 'Think about this problem',
+    })
+
+    // Check second streaming chunk
+    expect(mockSendSubagentChunk).toHaveBeenNthCalledWith(2, {
+      userInputId: 'test-input',
+      agentId: expect.any(String),
+      agentType: 'thinker',
+      chunk: 'Found a solution!',
+      prompt: 'Think about this problem',
+    })
+  })
+
+  it('should include correct agentId and agentType in streaming messages', async () => {
+    const ws = new MockWebSocket() as unknown as WebSocket
+    const sessionState = getInitialSessionState(mockFileContext)
+    const agentState = sessionState.mainAgentState
+
+    const parentTemplate = {
+      id: 'base',
+      spawnableAgents: ['thinker'],
+    } as unknown as AgentTemplate
+
+    const toolCall = {
+      toolName: 'spawn_agents' as const,
+      toolCallId: 'test-tool-call-id-2',
+      args: {
+        agents: [
+          {
+            agent_type: 'thinker',
+            prompt: 'Test prompt',
+          },
+        ],
+      },
+    }
+
+    const { result } = handleSpawnAgents({
+      previousToolCallFinished: Promise.resolve(),
+      toolCall,
+      fileContext: mockFileContext,
+      clientSessionId: 'test-session',
+      userInputId: 'test-input-123',
+      getLatestState: () => ({ messages: [] }),
+      state: {
+        ws,
+        fingerprintId: 'test-fingerprint',
+        userId: TEST_USER_ID,
+        agentTemplate: parentTemplate,
+        sendSubagentChunk: mockSendSubagentChunk,
+        messages: [],
+        agentState,
+      },
+    })
+    await result
+
+    // Verify the streaming messages have consistent agentId and correct agentType
+    expect(mockSendSubagentChunk.mock.calls.length).toBeGreaterThanOrEqual(2)
+    const calls = mockSendSubagentChunk.mock.calls as Array<
+      [
+        {
+          userInputId: string
+          agentId: string
+          agentType: string
+          chunk: string
+          prompt?: string
+        },
+      ]
+    >
+    const firstCall = calls[0][0]
+    const secondCall = calls[1][0]
+
+    expect(firstCall.agentId).toBe(secondCall.agentId) // Same agent ID
+    expect(firstCall.agentType).toBe('thinker')
+    expect(secondCall.agentType).toBe('thinker')
+    expect(firstCall.userInputId).toBe('test-input-123')
+    expect(secondCall.userInputId).toBe('test-input-123')
+  })
+})
@@ -12,9 +12,9 @@ import { asyncAgentManager } from '../../async-agent-manager'
 import { agentRegistry } from '../../templates/agent-registry'
 import { AgentTemplate } from '../../templates/types'
 import { logger } from '../../util/logger'
-import { CodebuffToolCall, CodebuffToolHandlerFunction } from '../constants'
-import { handleSpawnAgents } from './spawn-agents'
 
+import { CodebuffToolCall, CodebuffToolHandlerFunction } from '../constants'
+import { handleSpawnAgents, SendSubagentChunk } from './spawn-agents'
 export const handleSpawnAgentsAsync = ((params: {
   previousToolCallFinished: Promise<void>
   toolCall: CodebuffToolCall<'spawn_agents_async'>
@@ -29,6 +29,7 @@ export const handleSpawnAgentsAsync = ((params: {
     fingerprintId?: string
     userId?: string
     agentTemplate?: AgentTemplate
+    sendSubagentChunk?: SendSubagentChunk
     messages?: CodebuffMessage[]
     agentState?: AgentState
   }
@@ -59,6 +60,7 @@ export const handleSpawnAgentsAsync = ((params: {
     fingerprintId,
     userId,
     agentTemplate: parentAgentTemplate,
+    sendSubagentChunk,
     messages,
   } = state
   let { agentState } = state
@@ -88,6 +90,11 @@ export const handleSpawnAgentsAsync = ((params: {
       'Internal error for spawn_agents: Missing agentState in state'
     )
   }
+  if (!sendSubagentChunk) {
+    throw new Error(
+      'Internal error for spawn_agents_async: Missing sendSubagentChunk in state'
+    )
+  }
 
   // Initialize registry and get all templates
   agentRegistry.initialize(fileContext)
@@ -176,6 +183,7 @@ export const handleSpawnAgentsAsync = ((params: {
           try {
             // Import loopAgentSteps dynamically to avoid circular dependency
             const { loopAgentSteps } = await import('../../run-agent-step')
+
             const result = await loopAgentSteps(ws, {
               userInputId: `${userInputId}-async-${agentType}-${agentId}`,
               prompt: prompt || '',
@@ -187,7 +195,14 @@ export const handleSpawnAgentsAsync = ((params: {
               toolResults: [],
               userId,
               clientSessionId,
-              onResponseChunk: () => {}, // Async agents don't stream to parent
+              onResponseChunk: (chunk: string) =>
+                sendSubagentChunk({
+                  userInputId,
+                  agentId,
+                  agentType,
+                  chunk,
+                  prompt,
+                }),
             })
 
             // Send completion message to parent if agent has appropriate output mode