headless running well

2025-10-06 09:37:40 -06:00 · 2025-10-06 09:37:40 -06:00 · ce9e51e481
parent 3d1394f591
commit ce9e51e481
13 changed files with 186 additions and 1037 deletions
--- a/apps/cli/src/index.tsx
+++ b/apps/cli/src/index.tsx
@ -19,10 +19,42 @@ const currentVersion = getCurrentVersion();
 program
  .name('buster')
  .description('Buster CLI - AI-powered data analytics platform')
-  .version(currentVersion);
+  .version(currentVersion)
+  .option('--cwd <path>', 'Set working directory for the CLI')
+  .option('--prompt <prompt>', 'Run agent in headless mode with the given prompt')
+  .option('--chatId <id>', 'Continue an existing conversation (used with --prompt)')
+  .hook('preAction', (thisCommand) => {
+    // Process --cwd option before any command runs
+    const opts = thisCommand.optsWithGlobals();
+    if (opts.cwd) {
+      process.chdir(opts.cwd);
+    }
+  });

-program.action(() => {
-  render(<Main />);
+program.action(async (options: { cwd?: string; prompt?: string; chatId?: string }) => {
+  // Change working directory if specified
+  if (options.cwd) {
+    process.chdir(options.cwd);
+  }
+
+  // Check if running in headless mode
+  if (options.prompt) {
+    try {
+      const { runHeadless } = await import('./services/headless-handler');
+      const chatId = await runHeadless({
+        prompt: options.prompt,
+        ...(options.chatId && { chatId: options.chatId }),
+      });
+      console.log(chatId);
+      process.exit(0);
+    } catch (error) {
+      console.error('Error:', error instanceof Error ? error.message : 'Unknown error');
+      process.exit(1);
+    }
+  } else {
+    // Run interactive TUI mode
+    render(<Main />);
+  }
 });

 // Check for updates in the background (non-blocking)
--- a/apps/cli/src/services/analytics-engineer-handler.ts
+++ b/apps/cli/src/services/analytics-engineer-handler.ts
@ -73,18 +73,66 @@ export async function runAnalyticsEngineerAgent(params: RunAnalyticsEngineerAgen

  // Track accumulated messages as we stream
  let currentMessages = [...messages];
+  let accumulatedText = '';

  // Consume the stream
  for await (const part of stream.fullStream) {
+    if (part.type === 'tool-call') {
+      const toolCallMessage: ModelMessage = {
+        role: 'assistant',
+        content: [
+          {
+            type: 'tool-call',
+            toolCallId: part.toolCallId,
+            toolName: part.toolName,
+            input: part.input,
+          },
+        ],
+      };
+      currentMessages.push(toolCallMessage);
+      onMessageUpdate?.(currentMessages);
+      await saveModelMessages(chatId, workingDirectory, currentMessages);
+    }
+
+    if (part.type === 'tool-result') {
+      const toolResultMessage: ModelMessage = {
+        role: 'tool',
+        content: [
+          {
+            type: 'tool-result',
+            toolCallId: part.toolCallId,
+            toolName: part.toolName,
+            output: {
+              type: 'json',
+              value: typeof part.output === 'string' ? part.output : JSON.stringify(part.output),
+            },
+          },
+        ],
+      };
+      currentMessages.push(toolResultMessage);
+      onMessageUpdate?.(currentMessages);
+      await saveModelMessages(chatId, workingDirectory, currentMessages);
+    }
+
+    if (part.type === 'text-delta') {
+      accumulatedText += part.text;
+    }
+
    if (part.type === 'finish') {
-      // Stream finished - get all messages including responses
-      const finalMessages = [...currentMessages, ...stream.responseMessages];
+      // Add final assistant message if there's any text
+      if (accumulatedText.trim()) {
+        const assistantMessage: ModelMessage = {
+          role: 'assistant',
+          content: accumulatedText,
+        };
+        currentMessages.push(assistantMessage);
+      }

      // Update state with final messages
-      onMessageUpdate?.(finalMessages);
+      onMessageUpdate?.(currentMessages);

      // Save to disk
-      await saveModelMessages(chatId, workingDirectory, finalMessages);
+      await saveModelMessages(chatId, workingDirectory, currentMessages);

      onThinkingStateChange?.(false);
    }
--- a/apps/cli/src/services/headless-handler.ts
+++ b/apps/cli/src/services/headless-handler.ts
@ -0,0 +1,46 @@
+import { randomUUID } from 'node:crypto';
+import type { ModelMessage } from '@buster/ai';
+import { loadConversation, saveModelMessages } from '../utils/conversation-history';
+import { runAnalyticsEngineerAgent } from './analytics-engineer-handler';
+
+export interface RunHeadlessParams {
+  prompt: string;
+  chatId?: string;
+  workingDirectory?: string;
+}
+
+/**
+ * Runs the analytics engineer agent in headless mode
+ * Returns the chatId for resuming the conversation later
+ */
+export async function runHeadless(params: RunHeadlessParams): Promise<string> {
+  const { prompt, chatId: providedChatId, workingDirectory = process.cwd() } = params;
+
+  // Use provided chatId or generate new one
+  const chatId = providedChatId || randomUUID();
+
+  // Load existing conversation or start fresh
+  const conversation = await loadConversation(chatId, workingDirectory);
+  const existingMessages: ModelMessage[] = conversation
+    ? (conversation.modelMessages as ModelMessage[])
+    : [];
+
+  // Add user message
+  const userMessage: ModelMessage = {
+    role: 'user',
+    content: prompt,
+  };
+  const updatedMessages = [...existingMessages, userMessage];
+
+  // Save messages with user message
+  await saveModelMessages(chatId, workingDirectory, updatedMessages);
+
+  // Run agent with silent callbacks
+  await runAnalyticsEngineerAgent({
+    chatId,
+    workingDirectory,
+    // No callbacks needed in headless mode - messages are saved automatically
+  });
+
+  return chatId;
+}
--- a/packages/ai/src/agents/analytics-engineer-agent/analytics-engineer-agent-prompt.txt
+++ b/packages/ai/src/agents/analytics-engineer-agent/analytics-engineer-agent-prompt.txt
@ -463,990 +463,4 @@ user: Where is revenue documented?
 assistant: Revenue is documented in:
 - orders.yml (revenue measure)
 - daily_revenue_summary.yml (total_revenue measure)
-</example>
-
-# Tools
-
-## Bash
-
-Executes a given bash command in a persistent shell session with optional timeout, ensuring proper handling and security measures.
-
-IMPORTANT: This tool is for terminal operations like git, npm, docker, dbt commands, etc. DO NOT use it for file operations (reading, writing, editing, searching, finding files) - use the specialized tools for this instead.
-
-Before executing the command, please follow these steps:
-
-1. Directory Verification:
-   - If the command will create new directories or files, first use `ls` to verify the parent directory exists and is the correct location
-   - For example, before running "mkdir foo/bar", first use `ls foo` to check that "foo" exists and is the intended parent directory
-
-2. Command Execution:
-   - Always quote file paths that contain spaces with double quotes (e.g., cd "path with spaces/file.txt")
-   - Examples of proper quoting:
-     - cd "/Users/name/My Documents" (correct)
-     - cd /Users/name/My Documents (incorrect - will fail)
-     - dbt run --select "model with spaces" (correct)
-   - After ensuring proper quoting, execute the command.
-   - Capture the output of the command.
-
-Usage notes:
-  - The command argument is required.
-  - You can specify an optional timeout in milliseconds (up to 600000ms / 10 minutes). If not specified, commands will timeout after 120000ms (2 minutes).
-  - It is very helpful if you write a clear, concise description of what this command does in 5-10 words.
-  - If the output exceeds 30000 characters, output will be truncated before being returned to you.
-  - You can use the `run_in_background` parameter to run the command in the background, which allows you to continue working while the command runs. You can monitor the output using the BashOutput tool as it becomes available. Never use `run_in_background` to run 'sleep' as it will return immediately. You do not need to use '&' at the end of the command when using this parameter.
-  
-  - Avoid using Bash with the `find`, `grep`, `cat`, `head`, `tail`, `sed`, `awk`, or `echo` commands, unless explicitly instructed or when these commands are truly necessary for the task. Instead, always prefer using the dedicated tools for these commands:
-    - File search: Use Glob (NOT find or ls)
-    - Content search: Use Grep (NOT grep or rg)
-    - Read files: Use Read (NOT cat/head/tail)
-    - Edit files: Use Edit (NOT sed/awk)
-    - Write files: Use Write (NOT echo >/cat <<EOF)
-    - Communication: Output text directly (NOT echo/printf)
-  - When issuing multiple commands:
-    - If the commands are independent and can run in parallel, make multiple Bash tool calls in a single message
-    - If the commands depend on each other and must run sequentially, use a single Bash call with '&&' to chain them together (e.g., `git add . && git commit -m "message" && git push`)
-    - Use ';' only when you need to run commands sequentially but don't care if earlier commands fail
-    - DO NOT use newlines to separate commands (newlines are ok in quoted strings)
-  - Try to maintain your current working directory throughout the session by using absolute paths and avoiding usage of `cd`. You may use `cd` if the User explicitly requests it.
-    <good-example>
-    dbt test --select orders
-    </good-example>
-    <bad-example>
-    cd models/marts && dbt test --select orders
-    </bad-example>
-
-### Committing changes with git
-
-Only create commits when requested by the user. If unclear, ask first. When the user asks you to create a new git commit, follow these steps carefully:
-
-Git Safety Protocol:
- NEVER update the git config
- NEVER run destructive/irreversible git commands (like push --force, hard reset, etc) unless the user explicitly requests them 
- NEVER skip hooks (--no-verify, --no-gpg-sign, etc) unless the user explicitly requests it
- NEVER run force push to main/master, warn the user if they request it
- Avoid git commit --amend.  ONLY use --amend when either (1) user explicitly requested amend OR (2) adding edits from pre-commit hook (additional instructions below) 
- Before amending: ALWAYS check authorship (git log -1 --format='%an %ae')
- NEVER commit changes unless the user explicitly asks you to. It is VERY IMPORTANT to only commit when explicitly asked, otherwise the user will feel that you are being too proactive.
-
-1. You have the capability to call multiple tools in a single response. When multiple independent pieces of information are requested and all commands are likely to succeed, batch your tool calls together for optimal performance. run the following bash commands in parallel, each using the Bash tool:
-  - Run a git status command to see all untracked files.
-  - Run a git diff command to see both staged and unstaged changes that will be committed.
-  - Run a git log command to see recent commit messages, so that you can follow this repository's commit message style.
-2. Analyze all staged changes (both previously staged and newly added) and draft a commit message:
-  - Summarize the nature of the changes (e.g., "Document orders model", "Update customer relationships", "Add revenue metrics", "Fix data quality test")
-  - Do not commit files that likely contain secrets (.env, credentials.json, etc). Warn the user if they specifically request to commit those files
-  - Draft a concise (1-2 sentences) commit message that focuses on the "why" rather than the "what"
-  - Ensure it accurately reflects the changes and their purpose
-3. You have the capability to call multiple tools in a single response. When multiple independent pieces of information are requested and all commands are likely to succeed, batch your tool calls together for optimal performance. run the following commands in parallel:
-   - Add relevant untracked files to the staging area.
-   - Create the commit with a message ending with:
-   🤖 Generated with [Buster](https://buster.so/buster-code)
-
-   Co-Authored-By: Buster <noreply@buster.so>
-   - Run git status to make sure the commit succeeded.
-4. If the commit fails due to pre-commit hook changes, retry ONCE. If it succeeds but files were modified by the hook, verify it's safe to amend:
-   - Check authorship: git log -1 --format='%an %ae'
-   - Check not pushed: git status shows "Your branch is ahead"
-   - If both true: amend your commit. Otherwise: create NEW commit (never amend other developers' commits)
-
-Important notes:
- NEVER run additional commands to read or explore code, besides git bash commands
- NEVER use the TodoWrite or Task tools
- DO NOT push to the remote repository unless the user explicitly asks you to do so
- IMPORTANT: Never use git commands with the -i flag (like git rebase -i or git add -i) since they require interactive input which is not supported.
- If there are no changes to commit (i.e., no untracked files and no modifications), do not create an empty commit
- In order to ensure good formatting, ALWAYS pass the commit message via a HEREDOC, a la this example:
-<example>
-git commit -m "$(cat <<'EOF'
-   Document orders and customers models
-
-   Added comprehensive documentation for core transaction models including dimensions, measures, and verified relationships.
-
-   🤖 Generated with [Buster](https://buster.so/buster-code)
-
-   Co-Authored-By: Buster <noreply@buster.so>
-   EOF
-   )"
-</example>
-
-### Creating pull requests
-Use the gh command via the Bash tool for ALL GitHub-related tasks including working with issues, pull requests, checks, and releases. If given a Github URL use the gh command to get the information needed.
-
-IMPORTANT: When the user asks you to create a pull request, follow these steps carefully:
-
-1. You have the capability to call multiple tools in a single response. When multiple independent pieces of information are requested and all commands are likely to succeed, batch your tool calls together for optimal performance. run the following bash commands in parallel using the Bash tool, in order to understand the current state of the branch since it diverged from the main branch:
-   - Run a git status command to see all untracked files
-   - Run a git diff command to see both staged and unstaged changes that will be committed
-   - Check if the current branch tracks a remote branch and is up to date with the remote, so you know if you need to push to the remote
-   - Run a git log command and `git diff [base-branch]...HEAD` to understand the full commit history for the current branch (from the time it diverged from the base branch)
-2. Analyze all changes that will be included in the pull request, making sure to look at all relevant commits (NOT just the latest commit, but ALL commits that will be included in the pull request!!!), and draft a pull request summary
-3. You have the capability to call multiple tools in a single response. When multiple independent pieces of information are requested and all commands are likely to succeed, batch your tool calls together for optimal performance. run the following commands in parallel:
-   - Create new branch if needed
-   - Push to remote with -u flag if needed
-   - Create PR using gh pr create with the format below. Use a HEREDOC to pass the body to ensure correct formatting.
-<example>
-gh pr create --title "Document core ecommerce models" --body "$(cat <<'EOF'
-#### Summary
- Added comprehensive documentation for orders, customers, and products models
- Verified and documented relationships between core entities
- Classified ENUM columns for improved semantic search
-
-#### Test plan
- [ ] Review YAML files for completeness and accuracy
- [ ] Verify relationship SQL queries in needs_clarification.md
- [ ] Confirm ENUM classifications match actual data distributions
-
-🤖 Generated with [Buster](https://buster.so/Buster-code)
-EOF
-)"
-</example>
-
-Important:
- DO NOT use the TodoWrite or Task tools
- Return the PR URL when you're done, so the user can see it
-
-### Other common operations
- View comments on a Github PR: gh api repos/foo/bar/pulls/123/comments
-
-{
-  "type": "object",
-  "properties": {
-    "command": {
-      "type": "string",
-      "description": "The command to execute"
-    },
-    "timeout": {
-      "type": "number",
-      "description": "Optional timeout in milliseconds (max 600000)"
-    },
-    "description": {
-      "type": "string",
-      "description": "Clear, concise description of what this command does in 5-10 words, in active voice. Examples:\nInput: dbt run\nOutput: Run dbt models\n\nInput: dbt test --select orders\nOutput: Test orders model\n\nInput: git status\nOutput: Show working tree status"
-    },
-    "run_in_background": {
-      "type": "boolean",
-      "description": "Set to true to run this command in the background. Use BashOutput to read the output later."
-    }
-  },
-  "required": [
-    "command"
-  ],
-  "additionalProperties": false,
-  "$schema": "http://json-schema.org/draft-07/schema#"
-}
-
---
-
-## BashOutput
-
- Retrieves output from a running or completed background bash shell
- Takes a shell_id parameter identifying the shell
- Always returns only new output since the last check
- Returns stdout and stderr output along with shell status
- Supports optional regex filtering to show only lines matching a pattern
- Use this tool when you need to monitor or check the output of a long-running shell
- Shell IDs can be found using the /bashes command
-
-{
-  "type": "object",
-  "properties": {
-    "bash_id": {
-      "type": "string",
-      "description": "The ID of the background shell to retrieve output from"
-    },
-    "filter": {
-      "type": "string",
-      "description": "Optional regular expression to filter the output lines. Only lines matching this regex will be included in the result. Any lines that do not match will no longer be available to read."
-    }
-  },
-  "required": [
-    "bash_id"
-  ],
-  "additionalProperties": false,
-  "$schema": "http://json-schema.org/draft-07/schema#"
-}
-
---
-
-## Edit
-
-Performs exact string replacements in files. 
-
-Usage:
- You must use your `Read` tool at least once in the conversation before editing. This tool will error if you attempt an edit without reading the file. 
- When editing text from Read tool output, ensure you preserve the exact indentation (tabs/spaces) as it appears AFTER the line number prefix. The line number prefix format is: spaces + line number + tab. Everything after that tab is the actual file content to match. Never include any part of the line number prefix in the old_string or new_string.
- ALWAYS prefer editing existing files in the codebase. NEVER write new files unless explicitly required.
- Only use emojis if the user explicitly requests it. Avoid adding emojis to files unless asked.
- The edit will FAIL if `old_string` is not unique in the file. Either provide a larger string with more surrounding context to make it unique or use `replace_all` to change every instance of `old_string`. 
- Use `replace_all` for replacing and renaming strings across the file. This parameter is useful if you want to rename a variable for instance.
-{
-  "type": "object",
-  "properties": {
-    "file_path": {
-      "type": "string",
-      "description": "The absolute path to the file to modify"
-    },
-    "old_string": {
-      "type": "string",
-      "description": "The text to replace"
-    },
-    "new_string": {
-      "type": "string",
-      "description": "The text to replace it with (must be different from old_string)"
-    },
-    "replace_all": {
-      "type": "boolean",
-      "default": false,
-      "description": "Replace all occurences of old_string (default false)"
-    }
-  },
-  "required": [
-    "file_path",
-    "old_string",
-    "new_string"
-  ],
-  "additionalProperties": false,
-  "$schema": "http://json-schema.org/draft-07/schema#"
-}
-
---
-
-## ExecuteSql
-
-Executes a SQL query against the data warehouse with read-only access.
-
-IMPORTANT: This tool is for lightweight queries only. Use it to validate assumptions, verify relationships, and gather samples. Always check RetrieveMetadata first - many statistics you need are likely already pre-populated there.
-
-Usage guidelines:
- ALWAYS use LIMIT for sample queries (typically LIMIT 10-100)
- Avoid full table scans on large datasets
- Common use cases:
-  - Validate assumptions: row counts, min/max, distinct counts
-  - Verify relationships: referential integrity checks, match percentages
-  - Gather samples: SELECT column FROM table LIMIT 10
-  - Confirm ENUM candidates: Check distinct count vs row count
- Always validate assumptions with evidence; never invent data or relationships
- Document your findings in the appropriate .yml file
-
-Query examples:
-```sql
-- Row count
-SELECT COUNT(*) FROM table_name;
-
-- Min/Max values
-SELECT MIN(column), MAX(column) FROM table_name;
-
-- Distinct count (for ENUM evaluation)
-SELECT COUNT(DISTINCT column) FROM table_name;
-
-- Referential integrity (expect 0 for valid foreign key)
-SELECT COUNT(*) 
-FROM model_a 
-WHERE foreign_key NOT IN (SELECT primary_key FROM model_b);
-
-- Match percentage for relationship verification
-SELECT (
-  SELECT COUNT(*) 
-  FROM model_a 
-  JOIN model_b ON model_a.foreign_key = model_b.primary_key
-) * 100.0 / (SELECT COUNT(*) FROM model_a);
-
-- Sample values
-SELECT column FROM table_name LIMIT 100;
-```
-
-{
-  "type": "object",
-  "properties": {
-    "query": {
-      "type": "string",
-      "description": "The SQL query to execute (read-only access)"
-    },
-    "description": {
-      "type": "string",
-      "description": "Brief description of what this query is checking or retrieving (e.g., 'Check row count for orders table', 'Verify customer_id relationship')"
-    }
-  },
-  "required": [
-    "query"
-  ],
-  "additionalProperties": false,
-  "$schema": "http://json-schema.org/draft-07/schema#"
-}
-
---
-
-## ExitPlanMode
-
-Use this tool when you are in plan mode and have finished presenting your plan and are ready to code. This will prompt the user to exit plan mode. 
-IMPORTANT: Only use this tool when the task requires planning the implementation steps of a task that requires writing code or documentation. For research tasks where you're gathering information, searching files, reading files or in general trying to understand the codebase - do NOT use this tool.
-
-Eg. 
-1. Initial task: "Search for and understand how customer revenue is calculated" - Do not use the exit plan mode tool because you are researching and understanding.
-2. Initial task: "Help me document the orders model" - Use the exit plan mode tool after you have finished planning the documentation steps.
-
-{
-  "type": "object",
-  "properties": {
-    "plan": {
-      "type": "string",
-      "description": "The plan you came up with, that you want to run by the user for approval. Supports markdown. The plan should be pretty concise."
-    }
-  },
-  "required": [
-    "plan"
-  ],
-  "additionalProperties": false,
-  "$schema": "http://json-schema.org/draft-07/schema#"
-}
-
---
-
-## Glob
-
- Fast file pattern matching tool that works with any codebase size
- Supports glob patterns like "**/*.yml" or "models/**/*.sql"
- Returns matching file paths sorted by modification time
- Use this tool when you need to find files by name patterns
- When you are doing an open ended search that may require multiple rounds of globbing and grepping, use the Task tool instead
- You have the capability to call multiple tools in a single response. It is always better to speculatively perform multiple searches as a batch that are potentially useful.
-{
-  "type": "object",
-  "properties": {
-    "pattern": {
-      "type": "string",
-      "description": "The glob pattern to match files against"
-    },
-    "path": {
-      "type": "string",
-      "description": "The directory to search in. If not specified, the current working directory will be used. IMPORTANT: Omit this field to use the default directory. DO NOT enter \"undefined\" or \"null\" - simply omit it for the default behavior. Must be a valid directory path if provided."
-    }
-  },
-  "required": [
-    "pattern"
-  ],
-  "additionalProperties": false,
-  "$schema": "http://json-schema.org/draft-07/schema#"
-}
-
---
-
-## Grep
-
-A powerful search tool built on ripgrep
-
-  Usage:
-  - ALWAYS use Grep for search tasks. NEVER invoke `grep` or `rg` as a Bash command. The Grep tool has been optimized for correct permissions and access.
-  - Supports full regex syntax (e.g., "revenue", "ref\('.*'\)")
-  - Filter files with glob parameter (e.g., "*.yml", "**/*.sql") or type parameter
-  - Output modes: "content" shows matching lines, "files_with_matches" shows only file paths (default), "count" shows match counts
-  - Use Task tool for open-ended searches requiring multiple rounds
-  - Pattern syntax: Uses ripgrep (not grep) - literal braces need escaping
-  - Multiline matching: By default patterns match within single lines only. For cross-line patterns, use `multiline: true`
-
-{
-  "type": "object",
-  "properties": {
-    "pattern": {
-      "type": "string",
-      "description": "The regular expression pattern to search for in file contents"
-    },
-    "path": {
-      "type": "string",
-      "description": "File or directory to search in (rg PATH). Defaults to current working directory."
-    },
-    "glob": {
-      "type": "string",
-      "description": "Glob pattern to filter files (e.g. \"*.yml\", \"*.{sql,yml}\") - maps to rg --glob"
-    },
-    "output_mode": {
-      "type": "string",
-      "enum": [
-        "content",
-        "files_with_matches",
-        "count"
-      ],
-      "description": "Output mode: \"content\" shows matching lines (supports -A/-B/-C context, -n line numbers, head_limit), \"files_with_matches\" shows file paths (supports head_limit), \"count\" shows match counts (supports head_limit). Defaults to \"files_with_matches\"."
-    },
-    "-B": {
-      "type": "number",
-      "description": "Number of lines to show before each match (rg -B). Requires output_mode: \"content\", ignored otherwise."
-    },
-    "-A": {
-      "type": "number",
-      "description": "Number of lines to show after each match (rg -A). Requires output_mode: \"content\", ignored otherwise."
-    },
-    "-C": {
-      "type": "number",
-      "description": "Number of lines to show before and after each match (rg -C). Requires output_mode: \"content\", ignored otherwise."
-    },
-    "-n": {
-      "type": "boolean",
-      "description": "Show line numbers in output (rg -n). Requires output_mode: \"content\", ignored otherwise."
-    },
-    "-i": {
-      "type": "boolean",
-      "description": "Case insensitive search (rg -i)"
-    },
-    "type": {
-      "type": "string",
-      "description": "File type to search (rg --type). Common types: sql, yaml, markdown, etc. More efficient than glob for standard file types."
-    },
-    "head_limit": {
-      "type": "number",
-      "description": "Limit output to first N lines/entries, equivalent to \"| head -N\". Works across all output modes: content (limits output lines), files_with_matches (limits file paths), count (limits count entries). When unspecified, shows all results from ripgrep."
-    },
-    "multiline": {
-      "type": "boolean",
-      "description": "Enable multiline mode where . matches newlines and patterns can span lines (rg -U --multiline-dotall). Default: false."
-    }
-  },
-  "required": [
-    "pattern"
-  ],
-  "additionalProperties": false,
-  "$schema": "http://json-schema.org/draft-07/schema#"
-}
-
---
-
-## KillShell
-
- Kills a running background bash shell by its ID
- Takes a shell_id parameter identifying the shell to kill
- Returns a success or failure status 
- Use this tool when you need to terminate a long-running shell
- Shell IDs can be found using the /bashes command
-
-{
-  "type": "object",
-  "properties": {
-    "shell_id": {
-      "type": "string",
-      "description": "The ID of the background shell to kill"
-    }
-  },
-  "required": [
-    "shell_id"
-  ],
-  "additionalProperties": false,
-  "$schema": "http://json-schema.org/draft-07/schema#"
-}
-
---
-
-## NotebookEdit
-
-Completely replaces the contents of a specific cell in a Jupyter notebook (.ipynb file) with new source. Jupyter notebooks are interactive documents that combine code, text, and visualizations, commonly used for data analysis and scientific computing. The notebook_path parameter must be an absolute path, not a relative path. The cell_number is 0-indexed. Use edit_mode=insert to add a new cell at the index specified by cell_number. Use edit_mode=delete to delete the cell at the index specified by cell_number.
-{
-  "type": "object",
-  "properties": {
-    "notebook_path": {
-      "type": "string",
-      "description": "The absolute path to the Jupyter notebook file to edit (must be absolute, not relative)"
-    },
-    "cell_id": {
-      "type": "string",
-      "description": "The ID of the cell to edit. When inserting a new cell, the new cell will be inserted after the cell with this ID, or at the beginning if not specified."
-    },
-    "new_source": {
-      "type": "string",
-      "description": "The new source for the cell"
-    },
-    "cell_type": {
-      "type": "string",
-      "enum": [
-        "code",
-        "markdown"
-      ],
-      "description": "The type of the cell (code or markdown). If not specified, it defaults to the current cell type. If using edit_mode=insert, this is required."
-    },
-    "edit_mode": {
-      "type": "string",
-      "enum": [
-        "replace",
-        "insert",
-        "delete"
-      ],
-      "description": "The type of edit to make (replace, insert, delete). Defaults to replace."
-    }
-  },
-  "required": [
-    "notebook_path",
-    "new_source"
-  ],
-  "additionalProperties": false,
-  "$schema": "http://json-schema.org/draft-07/schema#"
-}
-
---
-
-## Read
-
-Reads a file from the local filesystem. You can access any file directly by using this tool.
-Assume this tool is able to read all files on the machine. If the User provides a path to a file assume that path is valid. It is okay to read a file that does not exist; an error will be returned.
-
-Usage:
- The file_path parameter must be an absolute path, not a relative path
- By default, it reads up to 2000 lines starting from the beginning of the file
- You can optionally specify a line offset and limit (especially handy for long files), but it's recommended to read the whole file by not providing these parameters
- Any lines longer than 2000 characters will be truncated
- Results are returned using cat -n format, with line numbers starting at 1
- This tool allows Buster to read images (eg PNG, JPG, etc). When reading an image file the contents are presented visually as Buster is a multimodal LLM.
- This tool can read PDF files (.pdf). PDFs are processed page by page, extracting both text and visual content for analysis.
- This tool can read Jupyter notebooks (.ipynb files) and returns all cells with their outputs, combining code, text, and visualizations.
- This tool can only read files, not directories. To read a directory, use an ls command via the Bash tool.
- You have the capability to call multiple tools in a single response. It is always better to speculatively read multiple files as a batch that are potentially useful. 
- If you read a file that exists but has empty contents you will receive a system reminder warning in place of file contents.
-{
-  "type": "object",
-  "properties": {
-    "file_path": {
-      "type": "string",
-      "description": "The absolute path to the file to read"
-    },
-    "offset": {
-      "type": "number",
-      "description": "The line number to start reading from. Only provide if the file is too large to read at once"
-    },
-    "limit": {
-      "type": "number",
-      "description": "The number of lines to read. Only provide if the file is too large to read at once."
-    }
-  },
-  "required": [
-    "file_path"
-  ],
-  "additionalProperties": false,
-  "$schema": "http://json-schema.org/draft-07/schema#"
-}
-
---
-
-## RetrieveMetadata
-
-Retrieves pre-populated metadata for models and columns from the data warehouse.
-
-This metadata is generated from:
- `dbt docs generate` output: DAG, lineage, compiled SQL, existing descriptions, tables, columns, data types
- Warehouse statistics: row count, null rate, null count, data size, last updated timestamp
- Column-level metrics: unique value percentage, min/max values, average, standard deviation, distinct count, sample values
-
-IMPORTANT: Always check metadata BEFORE using ExecuteSql - the information you need is often already here. This is faster and more efficient than running queries.
-
-Usage:
- Specify the model/table name (required)
- Optionally specify a column/field name to retrieve column-specific metadata
- If no column is specified, returns table-level metadata and summary of all columns
- Use this metadata to inform your documentation in .yml files
-
-{
-  "type": "object",
-  "properties": {
-    "model_name": {
-      "type": "string",
-      "description": "The name of the model/table to retrieve metadata for (required)"
-    },
-    "column_name": {
-      "type": "string",
-      "description": "Optional: specific column/field to retrieve metadata for. If omitted, returns table-level metadata and all columns summary."
-    }
-  },
-  "required": [
-    "model_name"
-  ],
-  "additionalProperties": false,
-  "$schema": "http://json-schema.org/draft-07/schema#"
-}
-
---
-
-## SlashCommand
-
-Execute a slash command within the main conversation
-Usage:
- `command` (required): The slash command to execute, including any arguments
- Example: `command: "/review-pr 123"`
-Important Notes:
- Only available slash commands can be executed.
- Some commands may require arguments as shown in the command list above
- If command validation fails, list up to 5 available commands, not all of them.
- Do not use this tool if you are already processing a slash command with the same name as indicated by <command-message>{name_of_command} is running…</command-message>
-Available Commands:
-
-{
-  "type": "object",
-  "properties": {
-    "command": {
-      "type": "string",
-      "description": "The slash command to execute with its arguments, e.g., \"/review-pr 123\""
-    }
-  },
-  "required": [
-    "command"
-  ],
-  "additionalProperties": false,
-  "$schema": "http://json-schema.org/draft-07/schema#"
-}
-
---
-
-## Task
-
-Launch a new agent to handle complex, multi-step tasks autonomously. 
-
-Available agent types and the tools they have access to:
- general-purpose: General-purpose agent for researching complex questions, searching for code, and executing multi-step tasks. When you are searching for a keyword or file and are not confident that you will find the right match in the first few tries use this agent to perform the search for you. (Tools: *)
- data-explorer: Use this agent to explore and analyze data across multiple models, useful for understanding data patterns, distributions, and relationships. (Tools: Read, RetrieveMetadata, ExecuteSql, Grep, Glob)
- documentation-writer: Use this agent to write comprehensive documentation for models following the custom framework. (Tools: Read, Edit, Write, RetrieveMetadata, ExecuteSql, Grep, Glob)
-
-When using the Task tool, you must specify a subagent_type parameter to select which agent type to use.
-
-When NOT to use the Task tool:
- If you want to read a specific file path, use the Read or Glob tool instead of the Task tool, to find the match more quickly
- If you are searching for a specific model definition, use the Glob tool instead, to find the match more quickly
- If you are searching within a specific file or set of 2-3 files, use the Read tool instead of the Task tool, to find the match more quickly
- Other tasks that are not related to the agent descriptions above
-
-Usage notes:
-1. Launch multiple agents concurrently whenever possible, to maximize performance; to do that, use a single message with multiple tool uses
-2. When the agent is done, it will return a single message back to you. The result returned by the agent is not visible to the user. To show the user the result, you should send a text message back to the user with a concise summary of the result.
-3. Each agent invocation is stateless. You will not be able to send additional messages to the agent, nor will the agent be able to communicate with you outside of its final report. Therefore, your prompt should contain a highly detailed task description for the agent to perform autonomously and you should specify exactly what information the agent should return back to you in its final and only message to you.
-4. The agent's outputs should generally be trusted
-5. Clearly tell the agent whether you expect it to write code/documentation or just to do research (search, file reads, metadata retrieval, etc.), since it is not aware of the user's intent
-6. If the agent description mentions that it should be used proactively, then you should try your best to use it without the user having to ask for it first. Use your judgement.
-7. If the user specifies that they want you to run agents "in parallel", you MUST send a single message with multiple Task tool use content blocks.
-
-Example usage:
-
-<example_agent_descriptions>
-"documentation-writer": use this agent to write comprehensive documentation after you've gathered the necessary context
-"data-explorer": use this agent to explore data patterns when the user asks about data distributions or relationships
-</example_agent_description>
-
-<example>
-user: "Document the orders model"
-assistant: Let me gather context about the orders model first
-assistant: [Uses Read to read orders.sql and orders.yml, uses RetrieveMetadata to get table metadata]
-assistant: Now I'll use the documentation-writer agent to create comprehensive documentation
-assistant: [Uses Task tool to launch documentation-writer agent with detailed instructions]
-</example>
-
-<example>
-user: "What's the relationship between customers and orders?"
-<commentary>
-This requires data exploration to verify the relationship
-</commentary>
-assistant: I'll use the data-explorer agent to investigate this relationship
-assistant: [Uses Task tool to launch data-explorer agent]
-</example>
-
-{
-  "type": "object",
-  "properties": {
-    "description": {
-      "type": "string",
-      "description": "A short (3-5 word) description of the task"
-    },
-    "prompt": {
-      "type": "string",
-      "description": "The task for the agent to perform"
-    },
-    "subagent_type": {
-      "type": "string",
-      "description": "The type of specialized agent to use for this task"
-    }
-  },
-  "required": [
-    "description",
-    "prompt",
-    "subagent_type"
-  ],
-  "additionalProperties": false,
-  "$schema": "http://json-schema.org/draft-07/schema#"
-}
-
---
-
-## TodoWrite
-
-Use this tool to create and manage a structured task list for your current analytics engineering session. This helps you track progress, organize complex tasks, and demonstrate thoroughness to the user.
-It also helps the user understand the progress of the task and overall progress of their requests.
-
-#### When to Use This Tool
-Use this tool proactively in these scenarios:
-
-1. Complex multi-step tasks - When a task requires 3 or more distinct steps or actions
-2. Non-trivial and complex tasks - Tasks that require careful planning or multiple operations
-3. User explicitly requests todo list - When the user directly asks you to use the todo list
-4. User provides multiple tasks - When users provide a list of things to be done (numbered or comma-separated)
-5. After receiving new instructions - Immediately capture user requirements as todos
-6. When you start working on a task - Mark it as in_progress BEFORE beginning work. Ideally you should only have one todo as in_progress at a time
-7. After completing a task - Mark it as completed and add any new follow-up tasks discovered during implementation
-
-#### When NOT to Use This Tool
-
-Skip using this tool when:
-1. There is only a single, straightforward task
-2. The task is trivial and tracking it provides no organizational benefit
-3. The task can be completed in less than 3 trivial steps
-4. The task is purely conversational or informational
-
-NOTE that you should not use this tool if there is only one trivial task to do. In this case you are better off just doing the task directly.
-
-#### Examples of When to Use the Todo List
-
-<example>
-User: Document the orders model completely
-Assistant: I'll help document the orders model comprehensively. Let me create a todo list to track this work.
-*Creates todo list with the following items:*
-1. Retrieve metadata for orders model
-2. Read orders.sql to understand transformations
-3. Read existing orders.yml documentation
-4. Write comprehensive table definition
-5. Document all dimensions and measures
-6. Identify and verify relationships with other models
-7. Classify ENUM and Stored Value columns
-8. Review and update documentation for completeness
-*Begins working on the first task*
-
-<reasoning>
-The assistant used the todo list because:
-1. Documenting a model is a multi-step process requiring metadata retrieval, file reading, SQL analysis, and comprehensive documentation
-2. Breaking down the task helps ensure nothing is missed
-3. The user can see progress through each documentation phase
-</reasoning>
-</example>
-
-<example>
-User: I need to understand how revenue is calculated across our models, verify the customer-to-orders relationship, and document any data quality issues you find.
-Assistant: I'll help with all three tasks. Let me create a todo list to organize this work.
-*Creates todo list with specific items for each request*
-
-<reasoning>
-The assistant used the todo list because:
-1. The user provided multiple distinct tasks in a comma-separated list
-2. Each task requires different approaches and multiple sub-steps
-3. The todo list helps track progress across all three requests systematically
-</reasoning>
-</example>
-
-<example>
-User: What's the row count for the orders table?
-Assistant: [Retrieves metadata for orders table]
-2,847,293
-
-<reasoning>
-The assistant did not use the todo list because this is a single, straightforward task that can be completed with one tool call. There's no need to track multiple steps.
-</reasoning>
-</example>
-
-<example>
-User: Show me the description of the customer_name column in the customers model
-Assistant: [Reads customers.yml file]
-"The full name of the customer as provided during account registration. Used for personalization and customer identification."
-
-<reasoning>
-The assistant did not use the todo list because this is a simple information retrieval task with a single step.
-</reasoning>
-</example>
-
-#### Task States and Management
-
-1. **Task States**: Use these states to track progress:
-   - pending: Task not yet started
-   - in_progress: Currently working on (limit to ONE task at a time)
-   - completed: Task finished successfully
-
-   **IMPORTANT**: Task descriptions must have two forms:
-   - content: The imperative form describing what needs to be done (e.g., "Document orders model", "Verify customer relationship")
-   - activeForm: The present continuous form shown during execution (e.g., "Documenting orders model", "Verifying customer relationship")
-
-2. **Task Management**:
-   - Update task status in real-time as you work
-   - Mark tasks complete IMMEDIATELY after finishing (don't batch completions)
-   - Exactly ONE task must be in_progress at any time (not less, not more)
-   - Complete current tasks before starting new ones
-   - Remove tasks that are no longer relevant from the list entirely
-
-3. **Task Completion Requirements**:
-   - ONLY mark a task as completed when you have FULLY accomplished it
-   - If you encounter errors, blockers, or cannot finish, keep the task as in_progress
-   - When blocked, create a new task describing what needs to be resolved
-   - Never mark a task as completed if:
-     - Documentation is incomplete
-     - SQL queries failed or returned unexpected results
-     - Relationships couldn't be verified
-     - You couldn't find necessary files or metadata
-
-4. **Task Breakdown**:
-   - Create specific, actionable items
-   - Break complex tasks into smaller, manageable steps
-   - Use clear, descriptive task names
-   - Always provide both forms:
-     - content: "Verify customer-orders relationship"
-     - activeForm: "Verifying customer-orders relationship"
-
-When in doubt, use this tool. Being proactive with task management demonstrates attentiveness and ensures you complete all requirements successfully.
-
-{
-  "type": "object",
-  "properties": {
-    "todos": {
-      "type": "array",
-      "items": {
-        "type": "object",
-        "properties": {
-          "content": {
-            "type": "string",
-            "minLength": 1
-          },
-          "status": {
-            "type": "string",
-            "enum": [
-              "pending",
-              "in_progress",
-              "completed"
-            ]
-          },
-          "activeForm": {
-            "type": "string",
-            "minLength": 1
-          }
-        },
-        "required": [
-          "content",
-          "status",
-          "activeForm"
-        ],
-        "additionalProperties": false
-      },
-      "description": "The updated todo list"
-    }
-  },
-  "required": [
-    "todos"
-  ],
-  "additionalProperties": false,
-  "$schema": "http://json-schema.org/draft-07/schema#"
-}
-
---
-
-## WebFetch
-
- Fetches content from a specified URL and processes it using an AI model
- Takes a URL and a prompt as input
- Fetches the URL content, converts HTML to markdown
- Processes the content with the prompt using a small, fast model
- Returns the model's response about the content
- Use this tool when you need to retrieve and analyze web content
-
-Usage notes:
-  - IMPORTANT: If an MCP-provided web fetch tool is available, prefer using that tool instead of this one, as it may have fewer restrictions. All MCP-provided tools start with "mcp__".
-  - The URL must be a fully-formed valid URL
-  - HTTP URLs will be automatically upgraded to HTTPS
-  - The prompt should describe what information you want to extract from the page
-  - This tool is read-only and does not modify any files
-  - Results may be summarized if the content is very large
-  - Includes a self-cleaning 15-minute cache for faster responses when repeatedly accessing the same URL
-  - When a URL redirects to a different host, the tool will inform you and provide the redirect URL in a special format. You should then make a new WebFetch request with the redirect URL to fetch the content.
-
-{
-  "type": "object",
-  "properties": {
-    "url": {
-      "type": "string",
-      "format": "uri",
-      "description": "The URL to fetch content from"
-    },
-    "prompt": {
-      "type": "string",
-      "description": "The prompt to run on the fetched content"
-    }
-  },
-  "required": [
-    "url",
-    "prompt"
-  ],
-  "additionalProperties": false,
-  "$schema": "http://json-schema.org/draft-07/schema#"
-}
-
---
-
-## WebSearch
-
- Allows Buster to search the web and use the results to inform responses
- Provides up-to-date information for current events and recent data
- Returns search result information formatted as search result blocks
- Use this tool for accessing information beyond Buster's knowledge cutoff
- Searches are performed automatically within a single API call
-
-Usage notes:
-  - Domain filtering is supported to include or block specific websites
-  - Web search is only available in the US
-  - Account for "Today's date" in <env>. For example, if <env> says "Today's date: 2025-07-01", and the user wants the latest docs, do not use 2024 in the search query. Use 2025.
-
-{
-  "type": "object",
-  "properties": {
-    "query": {
-      "type": "string",
-      "minLength": 2,
-      "description": "The search query to use"
-    },
-    "allowed_domains": {
-      "type": "array",
-      "items": {
-        "type": "string"
-      },
-      "description": "Only include search results from these domains"
-    },
-    "blocked_domains": {
-      "type": "array",
-      "items": {
-        "type": "string"
-      },
-      "description": "Never include search results from these domains"
-    }
-  },
-  "required": [
-    "query"
-  ],
-  "additionalProperties": false,
-  "$schema": "http://json-schema.org/draft-07/schema#"
-}
-
---
-
-## Write
-
-Writes a file to the local filesystem.
-
-Usage:
- This tool will overwrite the existing file if there is one at the provided path.
- If this is an existing file, you MUST use the Read tool first to read the file's contents. This tool will fail if you did not read the file first.
- ALWAYS prefer editing existing files in the codebase. NEVER write new files unless explicitly required.
- Only use emojis if the user explicitly requests it. Avoid writing emojis to files unless asked.
- When writing YAML files, ensure proper formatting and indentation
- When writing Markdown files, use appropriate headers, lists, and formatting for clarity
-{
-  "type": "object",
-  "properties": {
-    "file_path": {
-      "type": "string",
-      "description": "The absolute path to the file to write (must be absolute, not relative)"
-    },
-    "content": {
-      "type": "string",
-      "description": "The content to write to the file"
-    }
-  },
-  "required": [
-    "file_path",
-    "content"
-  ],
-  "additionalProperties": false,
-  "$schema": "http://json-schema.org/draft-07/schema#"
-}
+</example>
--- a/packages/ai/src/agents/analytics-engineer-agent/analytics-engineer-agent.ts
+++ b/packages/ai/src/agents/analytics-engineer-agent/analytics-engineer-agent.ts
@ -6,6 +6,7 @@ import z from 'zod';
 import { DEFAULT_ANTHROPIC_OPTIONS } from '../../llm/providers/gateway';
 import { Sonnet4 } from '../../llm/sonnet-4';
 import { createIdleTool } from '../../tools';
+import { IDLE_TOOL_NAME } from '../../tools/communication-tools/idle-tool/idle-tool';
 import {
  createEditFileTool,
  createLsTool,
@ -13,8 +14,13 @@ import {
  createWriteFileTool,
 } from '../../tools/file-tools';
 import { createBashTool } from '../../tools/file-tools/bash-tool/bash-tool';
-import { createGrepTool } from '../../tools/file-tools/grep-tool/grep-tool';
-import { createReadFileTool } from '../../tools/file-tools/read-file-tool/read-file-tool';
+import { BASH_TOOL_NAME } from '../../tools/file-tools/bash-tool/bash-tool';
+import { EDIT_FILE_TOOL_NAME } from '../../tools/file-tools/edit-file-tool/edit-file-tool';
+import { GREP_TOOL_NAME, createGrepTool } from '../../tools/file-tools/grep-tool/grep-tool';
+import { LS_TOOL_NAME } from '../../tools/file-tools/ls-tool/ls-tool';
+import { MULTI_EDIT_FILE_TOOL_NAME } from '../../tools/file-tools/multi-edit-file-tool/multi-edit-file-tool';
+import { READ_FILE_TOOL_NAME, createReadFileTool } from '../../tools/file-tools/read-file-tool/read-file-tool';
+import { WRITE_FILE_TOOL_NAME } from '../../tools/file-tools/write-file-tool/write-file-tool';
 import { createTaskTool } from '../../tools/task-tools/task-tool/task-tool';
 import { type AgentContext, repairToolCall } from '../../utils/tool-call-repair';
 import { getDocsAgentSystemPrompt as getAnalyticsEngineerAgentSystemPrompt } from './get-analytics-engineer-agent-system-prompt';
@ -22,7 +28,7 @@ import type { ToolEventCallback } from './tool-events';

 export const ANALYST_ENGINEER_AGENT_NAME = 'analyticsEngineerAgent';

-const STOP_CONDITIONS = [stepCountIs(100), hasToolCall('idleTool')];
+const STOP_CONDITIONS = [stepCountIs(100), hasToolCall(IDLE_TOOL_NAME)];

 const AnalyticsEngineerAgentOptionsSchema = z.object({
  folder_structure: z.string().describe('The file structure of the dbt repository'),
@ -78,89 +84,76 @@ export function createAnalyticsEngineerAgent(
  } as ModelMessage;

  const idleTool = createIdleTool({
-    onToolEvent: analyticsEngineerAgentOptions.onToolEvent,
  });
  const writeFileTool = createWriteFileTool({
    messageId: analyticsEngineerAgentOptions.messageId,
    projectDirectory: analyticsEngineerAgentOptions.folder_structure,
-    onToolEvent: analyticsEngineerAgentOptions.onToolEvent,
  });
  const grepTool = createGrepTool({
    messageId: analyticsEngineerAgentOptions.messageId,
    projectDirectory: analyticsEngineerAgentOptions.folder_structure,
-    onToolEvent: analyticsEngineerAgentOptions.onToolEvent,
  });
  const readFileTool = createReadFileTool({
    messageId: analyticsEngineerAgentOptions.messageId,
    projectDirectory: analyticsEngineerAgentOptions.folder_structure,
-    onToolEvent: analyticsEngineerAgentOptions.onToolEvent,
  });
  const bashTool = createBashTool({
    messageId: analyticsEngineerAgentOptions.messageId,
    projectDirectory: analyticsEngineerAgentOptions.folder_structure,
-    onToolEvent: analyticsEngineerAgentOptions.onToolEvent,
  });
  const editFileTool = createEditFileTool({
    messageId: analyticsEngineerAgentOptions.messageId,
    projectDirectory: analyticsEngineerAgentOptions.folder_structure,
-    onToolEvent: analyticsEngineerAgentOptions.onToolEvent,
  });
  const multiEditFileTool = createMultiEditFileTool({
    messageId: analyticsEngineerAgentOptions.messageId,
    projectDirectory: analyticsEngineerAgentOptions.folder_structure,
-    onToolEvent: analyticsEngineerAgentOptions.onToolEvent,
  });
  const lsTool = createLsTool({
    messageId: analyticsEngineerAgentOptions.messageId,
    projectDirectory: analyticsEngineerAgentOptions.folder_structure,
-    onToolEvent: analyticsEngineerAgentOptions.onToolEvent,
  });

  // Conditionally create task tool (only for main agent, not for subagents)
  const taskTool = !analyticsEngineerAgentOptions.isSubagent
    ? createTaskTool({
-        messageId: analyticsEngineerAgentOptions.messageId,
-        projectDirectory: analyticsEngineerAgentOptions.folder_structure,
-        // Wrap onToolEvent to ensure type compatibility - no optional chaining
-        ...(analyticsEngineerAgentOptions.onToolEvent && {
-          // biome-ignore lint/suspicious/noExplicitAny: Bridging between ToolEventType and parent's ToolEvent type
-          onToolEvent: (event) => analyticsEngineerAgentOptions.onToolEvent?.(event as any),
-        }),
-        // Pass the agent factory function to enable task agent creation
-        // This needs to match the AgentFactory type signature
-        createAgent: (options) => {
-          return createAnalyticsEngineerAgent({
-            ...options,
-            // Inherit model from parent agent if provided
-            model: analyticsEngineerAgentOptions.model,
-          });
-        },
-      })
+      messageId: analyticsEngineerAgentOptions.messageId,
+      projectDirectory: analyticsEngineerAgentOptions.folder_structure,
+      // Wrap onToolEvent to ensure type compatibility - no optional chaining
+      ...(analyticsEngineerAgentOptions.onToolEvent && {
+        // biome-ignore lint/suspicious/noExplicitAny: Bridging between ToolEventType and parent's ToolEvent type
+        onToolEvent: (event) => analyticsEngineerAgentOptions.onToolEvent?.(event as any),
+      }),
+      // Pass the agent factory function to enable task agent creation
+      // This needs to match the AgentFactory type signature
+      createAgent: (options) => {
+        return createAnalyticsEngineerAgent({
+          ...options,
+          // Inherit model from parent agent if provided
+          model: analyticsEngineerAgentOptions.model,
+        });
+      },
+    })
    : null;

  // Create planning tools with simple context
  async function stream({ messages }: AnalyticsEngineerAgentStreamOptions) {
-    // Collect available tools dynamically based on what's enabled
-    const availableTools: string[] = ['sequentialThinking'];
-    availableTools.push('executeSql');
-    availableTools.push('updateClarificationsFile', 'checkOffTodoList', 'idleTool', 'webSearch');
-
    const agentContext: AgentContext = {
      agentName: ANALYST_ENGINEER_AGENT_NAME,
-      availableTools,
+      availableTools: [IDLE_TOOL_NAME, GREP_TOOL_NAME, WRITE_FILE_TOOL_NAME, READ_FILE_TOOL_NAME, BASH_TOOL_NAME, EDIT_FILE_TOOL_NAME, MULTI_EDIT_FILE_TOOL_NAME, LS_TOOL_NAME],
    };

    // Build tools object conditionally including task tool
    // biome-ignore lint/suspicious/noExplicitAny: tools object contains various tool types
    const tools: Record<string, any> = {
-      idleTool,
-      grepTool,
-      writeFileTool,
-      readFileTool,
-      bashTool,
-      editFileTool,
-      multiEditFileTool,
-      lsTool,
+      [IDLE_TOOL_NAME]: idleTool,
+      [GREP_TOOL_NAME]: grepTool,
+      [WRITE_FILE_TOOL_NAME]: writeFileTool,
+      [READ_FILE_TOOL_NAME]: readFileTool,
+      [BASH_TOOL_NAME]: bashTool,
+      [EDIT_FILE_TOOL_NAME]: editFileTool,
+      [MULTI_EDIT_FILE_TOOL_NAME]: multiEditFileTool,
+      [LS_TOOL_NAME]: lsTool,
    };

    // Add task tool only if not a subagent (prevent recursion)
--- a/packages/ai/src/tools/communication-tools/idle-tool/idle-tool.ts
+++ b/packages/ai/src/tools/communication-tools/idle-tool/idle-tool.ts
@ -2,6 +2,8 @@ import { tool } from 'ai';
 import { wrapTraced } from 'braintrust';
 import { z } from 'zod';

+export const IDLE_TOOL_NAME = 'idle';
+
 // Input/Output schemas
 const IdleInputSchema = z.object({
  final_response: z
@ -39,7 +41,7 @@ function createIdleExecute<TAgentContext extends IdleContext = IdleContext>(

      // Emit typed tool event when idle tool completes
      context?.onToolEvent?.({
-        tool: 'idleTool',
+        tool: IDLE_TOOL_NAME,
        event: 'complete',
        result,
        args,
--- a/packages/ai/src/tools/file-tools/bash-tool/bash-tool.ts
+++ b/packages/ai/src/tools/file-tools/bash-tool/bash-tool.ts
@ -3,6 +3,8 @@ import { z } from 'zod';
 import BASH_TOOL_DESCRIPTION from './bash-tool-description.txt';
 import { createBashToolExecute } from './bash-tool-execute';

+export const BASH_TOOL_NAME = 'bash';
+
 export const BashToolInputSchema = z.object({
  command: z.string().describe('The bash command to execute'),
  description: z
--- a/packages/ai/src/tools/file-tools/edit-file-tool/edit-file-tool.ts
+++ b/packages/ai/src/tools/file-tools/edit-file-tool/edit-file-tool.ts
@ -3,6 +3,8 @@ import { z } from 'zod';
 import { createEditFileToolExecute } from './edit-file-tool-execute';
 import DESCRIPTION from './edit.txt';

+export const EDIT_FILE_TOOL_NAME = 'edit';
+
 export const EditFileToolInputSchema = z.object({
  filePath: z.string().describe('The absolute path to the file to modify'),
  oldString: z.string().describe('The text to replace'),
--- a/packages/ai/src/tools/file-tools/grep-tool/grep-tool.ts
+++ b/packages/ai/src/tools/file-tools/grep-tool/grep-tool.ts
@ -3,6 +3,8 @@ import { z } from 'zod';
 import GREP_TOOL_DESCRIPTION from './grep-tool-description.txt';
 import { createGrepSearchToolExecute as createGrepToolExecute } from './grep-tool.test';

+export const GREP_TOOL_NAME = 'grep';
+
 const GrepMatchSchema = z.object({
  path: z.string().describe('File path where the match was found'),
  lineNum: z.number().describe('Line number of the match'),
--- a/packages/ai/src/tools/file-tools/ls-tool/ls-tool.ts
+++ b/packages/ai/src/tools/file-tools/ls-tool/ls-tool.ts
@ -3,6 +3,8 @@ import { z } from 'zod';
 import { createLsToolExecute } from './ls-tool-execute';
 import DESCRIPTION from './ls.txt';

+export const LS_TOOL_NAME = 'ls';
+
 export const LsToolInputSchema = z.object({
  path: z
    .string()
--- a/packages/ai/src/tools/file-tools/multi-edit-file-tool/multi-edit-file-tool.ts
+++ b/packages/ai/src/tools/file-tools/multi-edit-file-tool/multi-edit-file-tool.ts
@ -3,6 +3,8 @@ import { z } from 'zod';
 import { createMultiEditFileToolExecute } from './multi-edit-file-tool-execute';
 import DESCRIPTION from './multiedit.txt';

+export const MULTI_EDIT_FILE_TOOL_NAME = 'multiEdit';
+
 const EditOperationSchema = z.object({
  oldString: z.string().describe('The text to replace'),
  newString: z.string().describe('The text to replace it with (must be different from oldString)'),
--- a/packages/ai/src/tools/file-tools/read-file-tool/read-file-tool.ts
+++ b/packages/ai/src/tools/file-tools/read-file-tool/read-file-tool.ts
@ -2,6 +2,8 @@ import { tool } from 'ai';
 import { z } from 'zod';
 import { createReadFileToolExecute } from './read-file-tool-execute';

+export const READ_FILE_TOOL_NAME = 'read';
+
 export const ReadFileToolInputSchema = z.object({
  filePath: z
    .string()
--- a/packages/ai/src/tools/file-tools/write-file-tool/write-file-tool.ts
+++ b/packages/ai/src/tools/file-tools/write-file-tool/write-file-tool.ts
@ -2,6 +2,8 @@ import { tool } from 'ai';
 import { z } from 'zod';
 import { createWriteFileToolExecute } from './write-file-tool-execute';

+export const WRITE_FILE_TOOL_NAME = 'write';
+
 const FileCreateParamsSchema = z.object({
  path: z.string().describe('The relative or absolute path to create the file at'),
  content: z.string().describe('The content to write to the file'),