suna/agentpress/thread_manager.py

411 lines
17 KiB
Python
Raw Normal View History

2024-10-06 01:04:15 +08:00
import json
import logging
2024-10-23 10:16:35 +08:00
import os
2024-11-12 19:37:47 +08:00
from typing import List, Dict, Any, Optional, Type, Union, AsyncGenerator
2024-10-10 22:21:39 +08:00
from agentpress.llm import make_llm_api_call
2024-10-23 09:28:12 +08:00
from agentpress.tool import Tool, ToolResult
2024-10-10 22:21:39 +08:00
from agentpress.tool_registry import ToolRegistry
from agentpress.thread_llm_response_processor import StandardLLMResponseProcessor
2024-11-18 06:36:37 +08:00
from agentpress.thread_llm_response_processor import ToolParserBase
from agentpress.thread_llm_response_processor import ToolExecutorBase
from agentpress.thread_llm_response_processor import ResultsAdderBase
2024-10-08 03:13:11 +08:00
import uuid
2024-10-10 22:21:39 +08:00
2024-10-06 01:04:15 +08:00
class ThreadManager:
"""Manages conversation threads with LLM models and tool execution.
The ThreadManager provides comprehensive conversation management, handling
message threading, tool registration, and LLM interactions.
Attributes:
threads_dir (str): Directory for storing thread files
tool_registry (ToolRegistry): Registry for managing available tools
Key Features:
- Thread creation and management
- Message handling with support for text and images
- Tool registration and execution
- LLM interaction with streaming support
- Error handling and cleanup
"""
def __init__(self, threads_dir: str = "threads"):
"""Initialize ThreadManager.
Args:
threads_dir (str): Directory to store thread files
"""
2024-10-23 10:16:35 +08:00
self.threads_dir = threads_dir
2024-10-06 01:04:15 +08:00
self.tool_registry = ToolRegistry()
2024-10-23 10:16:35 +08:00
os.makedirs(self.threads_dir, exist_ok=True)
2024-10-23 09:28:12 +08:00
def add_tool(self, tool_class: Type[Tool], function_names: Optional[List[str]] = None, **kwargs):
2024-10-23 09:28:12 +08:00
"""
Add a tool to the ThreadManager.
If function_names is provided, only register those specific functions.
If function_names is None, register all functions from the tool.
Args:
tool_class: The tool class to register
function_names: Optional list of function names to register
**kwargs: Additional keyword arguments passed to tool initialization
2024-10-23 09:28:12 +08:00
"""
self.tool_registry.register_tool(tool_class, function_names, **kwargs)
2024-10-06 01:04:15 +08:00
2024-10-23 10:16:35 +08:00
async def create_thread(self) -> str:
"""Create a new conversation thread.
Creates a new thread with a unique identifier and initializes its storage.
Returns:
str: Unique thread ID for the created thread
Raises:
IOError: If thread file creation fails
"""
2024-10-23 10:16:35 +08:00
thread_id = str(uuid.uuid4())
thread_path = os.path.join(self.threads_dir, f"{thread_id}.json")
with open(thread_path, 'w') as f:
json.dump({"messages": []}, f)
return thread_id
2024-10-06 01:04:15 +08:00
2024-10-23 10:16:35 +08:00
async def add_message(self, thread_id: str, message_data: Dict[str, Any], images: Optional[List[Dict[str, Any]]] = None):
"""Add a message to an existing thread.
Adds a new message to the specified thread, with support for text content
and image attachments. Handles message cleanup and state management.
Args:
thread_id: ID of the target thread
message_data: Message content and metadata
images: Optional list of image data dictionaries
Raises:
FileNotFoundError: If thread doesn't exist
Exception: For other operation failures
"""
2024-10-06 01:04:15 +08:00
logging.info(f"Adding message to thread {thread_id} with images: {images}")
2024-10-23 10:16:35 +08:00
thread_path = os.path.join(self.threads_dir, f"{thread_id}.json")
try:
with open(thread_path, 'r') as f:
thread_data = json.load(f)
messages = thread_data["messages"]
if message_data['role'] == 'user':
last_assistant_index = next((i for i in reversed(range(len(messages))) if messages[i]['role'] == 'assistant' and 'tool_calls' in messages[i]), None)
2024-10-06 01:04:15 +08:00
2024-10-23 10:16:35 +08:00
if last_assistant_index is not None:
tool_call_count = len(messages[last_assistant_index]['tool_calls'])
tool_response_count = sum(1 for msg in messages[last_assistant_index+1:] if msg['role'] == 'tool')
2024-10-06 01:04:15 +08:00
2024-10-23 10:16:35 +08:00
if tool_call_count != tool_response_count:
await self.cleanup_incomplete_tool_calls(thread_id)
for key, value in message_data.items():
if isinstance(value, ToolResult):
message_data[key] = str(value)
if images:
if isinstance(message_data['content'], str):
message_data['content'] = [{"type": "text", "text": message_data['content']}]
elif not isinstance(message_data['content'], list):
message_data['content'] = []
for image in images:
image_content = {
"type": "image_url",
"image_url": {
"url": f"data:{image['content_type']};base64,{image['base64']}",
"detail": "high"
2024-10-06 01:04:15 +08:00
}
2024-10-23 10:16:35 +08:00
}
message_data['content'].append(image_content)
messages.append(message_data)
thread_data["messages"] = messages
with open(thread_path, 'w') as f:
json.dump(thread_data, f)
logging.info(f"Message added to thread {thread_id}: {message_data}")
except Exception as e:
logging.error(f"Failed to add message to thread {thread_id}: {e}")
raise e
async def list_messages(self, thread_id: str, hide_tool_msgs: bool = False, only_latest_assistant: bool = False, regular_list: bool = True) -> List[Dict[str, Any]]:
"""
Retrieve messages from a thread with optional filtering.
Args:
thread_id (str): ID of the thread to retrieve messages from
hide_tool_msgs (bool): If True, excludes tool messages and tool calls
only_latest_assistant (bool): If True, returns only the most recent assistant message
regular_list (bool): If True, only includes standard message types
Returns:
List[Dict[str, Any]]: List of messages matching the filter criteria
"""
2024-10-23 10:16:35 +08:00
thread_path = os.path.join(self.threads_dir, f"{thread_id}.json")
try:
with open(thread_path, 'r') as f:
thread_data = json.load(f)
messages = thread_data["messages"]
2024-10-06 01:04:15 +08:00
if only_latest_assistant:
for msg in reversed(messages):
if msg.get('role') == 'assistant':
return [msg]
return []
2024-10-23 09:28:12 +08:00
filtered_messages = messages
2024-10-06 01:04:15 +08:00
if hide_tool_msgs:
filtered_messages = [
{k: v for k, v in msg.items() if k != 'tool_calls'}
for msg in filtered_messages
if msg.get('role') != 'tool'
]
if regular_list:
filtered_messages = [
msg for msg in filtered_messages
if msg.get('role') in ['system', 'assistant', 'tool', 'user']
]
return filtered_messages
2024-10-23 10:16:35 +08:00
except FileNotFoundError:
return []
2024-10-06 01:04:15 +08:00
2024-10-23 10:16:35 +08:00
async def cleanup_incomplete_tool_calls(self, thread_id: str):
2024-10-06 01:04:15 +08:00
messages = await self.list_messages(thread_id)
last_assistant_message = next((m for m in reversed(messages) if m['role'] == 'assistant' and 'tool_calls' in m), None)
if last_assistant_message:
tool_calls = last_assistant_message.get('tool_calls', [])
tool_responses = [m for m in messages[messages.index(last_assistant_message)+1:] if m['role'] == 'tool']
if len(tool_calls) != len(tool_responses):
failed_tool_results = []
for tool_call in tool_calls[len(tool_responses):]:
failed_tool_result = {
"role": "tool",
"tool_call_id": tool_call['id'],
"name": tool_call['function']['name'],
"content": "ToolResult(success=False, output='Execution interrupted. Session was stopped.')"
}
failed_tool_results.append(failed_tool_result)
assistant_index = messages.index(last_assistant_message)
messages[assistant_index+1:assistant_index+1] = failed_tool_results
2024-10-23 10:16:35 +08:00
thread_path = os.path.join(self.threads_dir, f"{thread_id}.json")
with open(thread_path, 'w') as f:
json.dump({"messages": messages}, f)
2024-10-06 01:04:15 +08:00
return True
return False
async def run_thread(
2024-11-12 19:37:47 +08:00
self,
thread_id: str,
system_message: Dict[str, Any],
model_name: str,
temperature: float = 0,
max_tokens: Optional[int] = None,
tool_choice: str = "auto",
temporary_message: Optional[Dict[str, Any]] = None,
use_tools: bool = False,
execute_tools: bool = True,
stream: bool = False,
2024-11-12 19:37:47 +08:00
immediate_tool_execution: bool = True,
2024-11-18 06:36:37 +08:00
parallel_tool_execution: bool = True,
tool_parser: Optional[ToolParserBase] = None,
tool_executor: Optional[ToolExecutorBase] = None,
results_adder: Optional[ResultsAdderBase] = None
) -> Union[Dict[str, Any], AsyncGenerator]:
2024-11-18 06:36:37 +08:00
"""Run a conversation thread with specified parameters."""
2024-10-06 01:04:15 +08:00
try:
messages = await self.list_messages(thread_id)
prepared_messages = [system_message] + messages
if temporary_message:
prepared_messages.append(temporary_message)
tools = self.tool_registry.get_all_tool_schemas() if use_tools else None
available_functions = self.tool_registry.get_available_functions() if use_tools else {}
response_processor = StandardLLMResponseProcessor(
2024-11-12 19:37:47 +08:00
thread_id=thread_id,
available_functions=available_functions,
add_message_callback=self.add_message,
update_message_callback=self._update_message,
list_messages_callback=self.list_messages,
parallel_tool_execution=parallel_tool_execution,
2024-11-18 06:36:37 +08:00
threads_dir=self.threads_dir,
tool_parser=tool_parser, # Use provided parser or default to Standard
tool_executor=tool_executor, # Use provided executor or default to Standard
results_adder=results_adder # Use provided adder or default to Standard
2024-11-12 19:37:47 +08:00
)
llm_response = await self._run_thread_completion(
messages=prepared_messages,
model_name=model_name,
2024-11-12 19:37:47 +08:00
temperature=temperature,
2024-10-23 09:28:12 +08:00
max_tokens=max_tokens,
tools=tools,
tool_choice=tool_choice if use_tools else None,
stream=stream
2024-10-17 04:08:46 +08:00
)
if stream:
return response_processor.process_stream(
response_stream=llm_response,
2024-11-12 19:37:47 +08:00
execute_tools=execute_tools,
immediate_execution=immediate_tool_execution
)
await response_processor.process_response(
2024-11-12 19:37:47 +08:00
response=llm_response,
execute_tools=execute_tools
)
return llm_response
2024-10-23 09:28:12 +08:00
except Exception as e:
logging.error(f"Error in run_thread: {str(e)}")
2024-10-08 03:13:11 +08:00
return {
2024-10-23 09:28:12 +08:00
"status": "error",
"message": str(e)
2024-10-08 03:13:11 +08:00
}
2024-10-06 01:04:15 +08:00
async def _run_thread_completion(
self,
messages: List[Dict[str, Any]],
model_name: str,
temperature: float,
max_tokens: Optional[int],
tools: Optional[List[Dict[str, Any]]],
tool_choice: Optional[str],
stream: bool
) -> Union[Any, AsyncGenerator]:
"""Get completion from LLM API."""
return await make_llm_api_call(
messages,
model_name,
temperature=temperature,
max_tokens=max_tokens,
tools=tools,
tool_choice=tool_choice,
stream=stream
)
async def _update_message(self, thread_id: str, message: Dict[str, Any]):
"""Update an existing message in the thread."""
thread_path = os.path.join(self.threads_dir, f"{thread_id}.json")
try:
with open(thread_path, 'r') as f:
thread_data = json.load(f)
# Find and update the last assistant message
for i in reversed(range(len(thread_data["messages"]))):
if thread_data["messages"][i]["role"] == "assistant":
thread_data["messages"][i] = message
break
with open(thread_path, 'w') as f:
json.dump(thread_data, f)
except Exception as e:
logging.error(f"Error updating message in thread {thread_id}: {e}")
raise e
2024-10-23 09:28:12 +08:00
if __name__ == "__main__":
import asyncio
from agentpress.examples.example_agent.tools.files_tool import FilesTool
2024-10-06 01:04:15 +08:00
2024-10-23 09:28:12 +08:00
async def main():
2024-11-12 19:53:07 +08:00
# Initialize managers
thread_manager = ThreadManager()
# Register available tools
thread_manager.add_tool(FilesTool)
# Create a new thread
thread_id = await thread_manager.create_thread()
2024-10-23 09:28:12 +08:00
# Add a test message
2024-11-12 19:53:07 +08:00
await thread_manager.add_message(thread_id, {
"role": "user",
"content": "Please create 10x files Each should be a chapter of a book about an Introduction to Robotics.."
})
2024-11-12 19:53:07 +08:00
# Define system message
system_message = {
"role": "system",
"content": "You are a helpful assistant that can create, read, update, and delete files."
}
2024-10-10 22:21:39 +08:00
2024-11-12 19:53:07 +08:00
# Test with streaming response and tool execution
print("\n🤖 Testing streaming response with tools:")
response = await thread_manager.run_thread(
2024-10-23 09:28:12 +08:00
thread_id=thread_id,
system_message=system_message,
2024-11-12 19:53:07 +08:00
model_name="anthropic/claude-3-5-haiku-latest",
2024-10-23 09:28:12 +08:00
temperature=0.7,
2024-11-12 19:53:07 +08:00
max_tokens=4096,
stream=True,
use_tools=True,
2024-11-12 19:53:07 +08:00
execute_tools=True,
immediate_tool_execution=True,
2024-11-12 19:54:53 +08:00
parallel_tool_execution=True
2024-10-23 09:28:12 +08:00
)
2024-10-10 22:21:39 +08:00
2024-11-12 19:53:07 +08:00
# Handle streaming response
if isinstance(response, AsyncGenerator):
print("\nAssistant is responding:")
content_buffer = ""
try:
async for chunk in response:
if hasattr(chunk.choices[0], 'delta'):
delta = chunk.choices[0].delta
# Handle content streaming
if hasattr(delta, 'content') and delta.content is not None:
content_buffer += delta.content
if delta.content.endswith((' ', '\n')):
print(content_buffer, end='', flush=True)
content_buffer = ""
# Handle tool calls
if hasattr(delta, 'tool_calls') and delta.tool_calls:
for tool_call in delta.tool_calls:
# Print tool name when it first appears
if tool_call.function and tool_call.function.name:
print(f"\n🛠️ Tool Call: {tool_call.function.name}", flush=True)
# Print arguments as they stream in
if tool_call.function and tool_call.function.arguments:
print(f" {tool_call.function.arguments}", end='', flush=True)
# Print any remaining content
if content_buffer:
print(content_buffer, flush=True)
print("\n✨ Response completed\n")
except Exception as e:
print(f"\n❌ Error processing stream: {e}")
else:
print("\n✨ Response completed\n")
# Display final thread state
messages = await thread_manager.list_messages(thread_id)
print("\n📝 Final Thread State:")
for msg in messages:
role = msg.get('role', 'unknown')
content = msg.get('content', '')
print(f"\n{role.upper()}: {content[:100]}...")
2024-10-06 01:04:15 +08:00
2024-10-23 09:28:12 +08:00
asyncio.run(main())