suna/agentpress/response_processor.py

import logging
from typing import Dict, Any, AsyncGenerator, Callable
from agentpress.tool_parser import ToolParser
from agentpress.tool_executor import ToolExecutor
import asyncio


class LLMResponseProcessor:
"""
Handles LLM response processing and tool execution management.
This class manages both streaming and non-streaming responses from Language Models,
coordinating tool execution timing and order. It maintains message state and handles
the execution of tool calls either immediately or after collecting a complete response,
with support for both parallel and sequential execution patterns.
Attributes:
thread_id (str): Identifier for the conversation thread
tool_executor (ToolExecutor): Executor for handling tool calls
tool_parser (ToolParser): Parser for processing LLM responses
available_functions (Dict): Registry of available tool functions
add_message (Callable): Callback to add messages to the thread
update_message (Callable): Callback to update existing messages
parallel_tool_execution (bool): Whether to execute tools in parallel or sequentially
tool_calls_buffer (Dict): Buffer for storing incomplete tool calls during streaming
processed_tool_calls (set): Set of already processed tool call IDs
current_message (Dict): Current message being processed in streaming mode
2024-11-13 07:57:38 +08:00
content_buffer (str): Buffer for accumulating content during streaming
tool_calls_accumulated (list): List of tool calls accumulated during streaming
message_added (bool): Flag to indicate if a message has been added to the thread
2024-11-12 19:37:47 +08:00
"""

    def __init__(
        self,
        thread_id: str,
        tool_executor: ToolExecutor,
        tool_parser: ToolParser,
        available_functions: Dict,
        add_message_callback: Callable,
        update_message_callback: Callable
    ):
        self.thread_id = thread_id
        self.tool_executor = tool_executor
        self.tool_parser = tool_parser
        self.available_functions = available_functions
        self.add_message = add_message_callback
        self.update_message = update_message_callback

        # State tracking for streaming responses
        self.tool_calls_buffer = {}
        self.processed_tool_calls = set()
        self.content_buffer = ""
        self.tool_calls_accumulated = []
        self.message_added = False

    async def process_stream(
        self,
        response_stream: AsyncGenerator,
        execute_tools: bool = True,
        immediate_execution: bool = True
    ) -> AsyncGenerator:
        """
        Process a streaming LLM response and handle tool execution.

        Yields chunks immediately as they arrive, while handling tool execution
        and message management in background tasks.
        """
        pending_tool_calls = []

        async def handle_message_management(chunk):
            # Accumulate streamed content
            if hasattr(chunk.choices[0].delta, 'content') and chunk.choices[0].delta.content:
                self.content_buffer += chunk.choices[0].delta.content

            # Parse and accumulate tool calls from this chunk
            parsed_message, is_complete = await self.tool_parser.parse_stream(
                chunk,
                self.tool_calls_buffer
            )
            if parsed_message and 'tool_calls' in parsed_message:
                self.tool_calls_accumulated = parsed_message['tool_calls']

            # Add or update the assistant message once there is something to store
            if chunk.choices[0].finish_reason or (self.content_buffer and self.tool_calls_accumulated):
                message = {
                    "role": "assistant",
                    "content": self.content_buffer
                }
                if self.tool_calls_accumulated:
                    message["tool_calls"] = self.tool_calls_accumulated

                if not self.message_added:
                    await self.add_message(self.thread_id, message)
                    self.message_added = True
                else:
                    await self.update_message(self.thread_id, message)

            # Execute any tool calls that have not been processed yet
            if execute_tools and self.tool_calls_accumulated:
                new_tool_calls = [
                    tool_call for tool_call in self.tool_calls_accumulated
                    if tool_call['id'] not in self.processed_tool_calls
                ]

                if new_tool_calls:
                    if immediate_execution:
                        results = await self.tool_executor.execute_tool_calls(
                            tool_calls=new_tool_calls,
                            available_functions=self.available_functions,
                            thread_id=self.thread_id,
                            executed_tool_calls=self.processed_tool_calls
                        )
                        for result in results:
                            await self.add_message(self.thread_id, result)
                            self.processed_tool_calls.add(result['tool_call_id'])
                    else:
                        pending_tool_calls.extend(new_tool_calls)

            # At the end of the stream, flush any deferred tool calls
            if chunk.choices[0].finish_reason:
                if not immediate_execution and pending_tool_calls:
                    results = await self.tool_executor.execute_tool_calls(
                        tool_calls=pending_tool_calls,
                        available_functions=self.available_functions,
                        thread_id=self.thread_id,
                        executed_tool_calls=self.processed_tool_calls
                    )
                    for result in results:
                        await self.add_message(self.thread_id, result)
                        self.processed_tool_calls.add(result['tool_call_id'])
                    pending_tool_calls.clear()
        # Keep references to the background tasks: bare create_task() results
        # can be garbage-collected before completion, silently dropping work.
        background_tasks = []
        async for chunk in response_stream:
            # Handle message management and tool execution in the background
            background_tasks.append(asyncio.create_task(handle_message_management(chunk)))
            # Immediately yield the chunk to the caller
            yield chunk

        # Ensure all message updates and tool executions have finished
        if background_tasks:
            await asyncio.gather(*background_tasks)

    async def process_response(
        self,
        response: Any,
        execute_tools: bool = True
    ) -> None:
        """
        Process a complete LLM response and execute tools.

        Handles non-streaming responses, parsing the complete response and
        executing any tool calls according to the configured execution strategy.

        Args:
            response: Complete response from the LLM
            execute_tools: Whether to execute identified tool calls
        """
        try:
            assistant_message = await self.tool_parser.parse_response(response)
            await self.add_message(self.thread_id, assistant_message)

            if execute_tools and assistant_message.get('tool_calls'):
                results = await self.tool_executor.execute_tool_calls(
                    tool_calls=assistant_message['tool_calls'],
                    available_functions=self.available_functions,
                    thread_id=self.thread_id,
                    executed_tool_calls=self.processed_tool_calls
                )
                for result in results:
                    await self.add_message(self.thread_id, result)
                    logging.info(f"Tool execution result: {result}")
        except Exception as e:
            logging.error(f"Error processing response: {e}")
            # Fall back to storing whatever content the response carried
            response_content = response.choices[0].message.get('content', '')
            await self.add_message(self.thread_id, {
                "role": "assistant",
                "content": response_content or ""
            })
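

# ---------------------------------------------------------------------------
# Usage sketch (illustrative only, not part of the agentpress API): a minimal
# wiring of LLMResponseProcessor into a conversation loop. The `stream_llm`
# and `call_llm` coroutines and the in-memory message store are assumptions
# made for this example; in agentpress the thread manager supplies the real
# executor, parser, and message callbacks.
async def _example_usage(stream_llm, call_llm, tool_executor: ToolExecutor,
                         tool_parser: ToolParser) -> None:
    messages = []  # hypothetical in-memory stand-in for thread storage

    async def add_message(thread_id, message):
        messages.append(message)

    async def update_message(thread_id, message):
        messages[-1] = message  # replace the in-progress assistant message

    processor = LLMResponseProcessor(
        thread_id="thread-1",
        tool_executor=tool_executor,
        tool_parser=tool_parser,
        available_functions={},  # name -> callable registry for tool dispatch
        add_message_callback=add_message,
        update_message_callback=update_message,
    )

    # Streaming path: chunks are re-yielded as they arrive, while message
    # bookkeeping and tool execution run in background tasks.
    async for chunk in processor.process_stream(stream_llm(messages)):
        delta = chunk.choices[0].delta
        if getattr(delta, "content", None):
            print(delta.content, end="", flush=True)

    # Non-streaming path: the complete response is parsed and any tool calls
    # are executed in a single pass.
    await processor.process_response(await call_llm(messages), execute_tools=True)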