add stream option

This commit is contained in:
LE Quoc Dat 2025-04-17 22:51:51 +01:00
parent 36c8fce0f6
commit 94ee217e36
2 changed files with 42 additions and 17 deletions

View File

@@ -23,6 +23,7 @@ class AgentStartRequest(BaseModel):
model_name: Optional[str] = "anthropic/claude-3-7-sonnet-latest"
enable_thinking: Optional[bool] = False
reasoning_effort: Optional[str] = 'low'
stream: Optional[bool] = False # Add stream option, default to False
# Initialize shared resources
router = APIRouter()
@@ -249,7 +250,7 @@ async def start_agent(
user_id: str = Depends(get_current_user_id)
):
"""Start an agent for a specific thread in the background with dynamic settings."""
logger.info(f"Starting new agent for thread: {thread_id} with model: {body.model_name}, thinking: {body.enable_thinking}, effort: {body.reasoning_effort}")
logger.info(f"Starting new agent for thread: {thread_id} with model: {body.model_name}, thinking: {body.enable_thinking}, effort: {body.reasoning_effort}, stream: {body.stream}")
client = await db.client
# Verify user has access to this thread
@@ -311,7 +312,8 @@ async def start_agent(
project_id=project_id,
model_name=body.model_name,
enable_thinking=body.enable_thinking,
reasoning_effort=body.reasoning_effort
reasoning_effort=body.reasoning_effort,
stream=body.stream # Pass stream parameter
)
)
@@ -446,10 +448,11 @@ async def run_agent_background(
project_id: str,
model_name: str, # Add model_name parameter
enable_thinking: Optional[bool], # Add enable_thinking parameter
reasoning_effort: Optional[str] # Add reasoning_effort parameter
reasoning_effort: Optional[str], # Add reasoning_effort parameter
stream: bool # Add stream parameter
):
"""Run the agent in the background and handle status updates."""
logger.debug(f"Starting background agent run: {agent_run_id} for thread: {thread_id} (instance: {instance_id}) with model: {model_name}")
logger.debug(f"Starting background agent run: {agent_run_id} for thread: {thread_id} (instance: {instance_id}) with model: {model_name}, stream: {stream}")
client = await db.client
# Tracking variables
@@ -570,7 +573,7 @@ async def run_agent_background(
agent_gen = run_agent(
thread_id=thread_id,
project_id=project_id,
stream=True,
stream=stream, # Pass stream parameter from API request
thread_manager=thread_manager,
model_name=model_name, # Pass model_name
enable_thinking=enable_thinking, # Pass enable_thinking

View File

@@ -23,7 +23,7 @@ load_dotenv()
async def run_agent(
thread_id: str,
project_id: str,
stream: bool = True,
stream: bool, # Accept stream parameter from caller (api.py)
thread_manager: Optional[ThreadManager] = None,
native_max_auto_continues: int = 25,
max_iterations: int = 150,
@@ -180,7 +180,7 @@ async def run_agent(
response = await thread_manager.run_thread(
thread_id=thread_id,
system_prompt=system_message, # Pass the constructed message
stream=stream,
stream=stream, # Pass the stream parameter received by run_agent
llm_model=model_name, # Use the passed model_name
llm_temperature=1, # Example temperature
llm_max_tokens=max_tokens, # Use the determined value
@@ -295,7 +295,8 @@ async def test_agent():
if not user_message.strip():
print("\n🔄 Running agent...\n")
await process_agent_response(thread_id, project_id, thread_manager)
# Pass stream=True explicitly when calling from test_agent
await process_agent_response(thread_id, project_id, thread_manager, stream=True)
continue
# Add the user message to the thread
@@ -310,17 +311,38 @@ async def test_agent():
)
print("\n🔄 Running agent...\n")
await process_agent_response(thread_id, project_id, thread_manager)
# Pass stream=True explicitly when calling from test_agent
await process_agent_response(thread_id, project_id, thread_manager, stream=True)
print("\n👋 Test completed. Goodbye!")
async def process_agent_response(thread_id: str, project_id: str, thread_manager: ThreadManager):
"""Process the streaming response from the agent."""
async def process_agent_response(
thread_id: str,
project_id: str,
thread_manager: ThreadManager,
stream: bool = True, # Add stream parameter, default to True for testing
model_name: str = "anthropic/claude-3-7-sonnet-latest", # Add model_name with default
enable_thinking: Optional[bool] = False, # Add enable_thinking
reasoning_effort: Optional[str] = 'low' # Add reasoning_effort
):
"""Process the streaming response from the agent, passing model/thinking parameters."""
chunk_counter = 0
current_response = ""
tool_call_counter = 0 # Track number of tool calls
async for chunk in run_agent(thread_id=thread_id, project_id=project_id, stream=True, thread_manager=thread_manager, native_max_auto_continues=25):
# Pass the received parameters to the run_agent call
agent_generator = run_agent(
thread_id=thread_id,
project_id=project_id,
stream=stream, # Pass the stream parameter here
thread_manager=thread_manager,
native_max_auto_continues=25,
model_name=model_name,
enable_thinking=enable_thinking,
reasoning_effort=reasoning_effort
)
async for chunk in agent_generator:
chunk_counter += 1
if chunk.get('type') == 'content' and 'content' in chunk: