buster/packages/ai/src/agents/analytics-engineer-agent/analytics-engineer-agent.ts

import type { LanguageModelV2 } from '@ai-sdk/provider';
import type { Sandbox } from '@buster/sandbox';
import { type ModelMessage, hasToolCall, stepCountIs, streamText } from 'ai';
import { wrapTraced } from 'braintrust';
import z from 'zod';
import { DEFAULT_ANTHROPIC_OPTIONS } from '../../llm/providers/gateway';
import { Sonnet4 } from '../../llm/sonnet-4';
import { createIdleTool } from '../../tools';
import { createEditFileTool, createLsTool, createMultiEditFileTool, createWriteFileTool } from '../../tools/file-tools';
import { createBashTool } from '../../tools/file-tools/bash-tool/bash-tool';
import { createGrepTool } from '../../tools/file-tools/grep-tool/grep-tool';
import { createReadFileTool } from '../../tools/file-tools/read-file-tool/read-file-tool';
import { type AgentContext, repairToolCall } from '../../utils/tool-call-repair';
import { getDocsAgentSystemPrompt as getAnalyticsEngineerAgentSystemPrompt } from './get-analytics-engineer-agent-system-prompt';
import type { ToolEventCallback } from './tool-events';

/**
 * Name this agent reports about itself; it is placed in the `AgentContext`
 * handed to the tool-call repair helper.
 *
 * NOTE(review): the identifier says "ANALYST" while the value says "analytics";
 * the name is exported, so it is left as-is here.
 */
export const ANALYST_ENGINEER_AGENT_NAME = 'analyticsEngineerAgent';

/** Step budget used for the step-count stop condition. */
const MAX_AGENT_STEPS = 100;

/** Tool whose invocation is used as a stop condition. */
const IDLE_TOOL_NAME = 'idleTool';

/** Stop conditions supplied to `streamText` through `stopWhen`. */
const STOP_CONDITIONS = [stepCountIs(MAX_AGENT_STEPS), hasToolCall(IDLE_TOOL_NAME)];

/**
 * Structural check used to validate a sandbox value: accepts any non-null
 * object that has both an `id` and an `fs` key. Only key presence is checked,
 * not the types of the values behind them.
 */
function looksLikeSandbox(candidate: unknown): boolean {
  if (typeof candidate !== 'object' || candidate === null) {
    return false;
  }
  return 'id' in candidate && 'fs' in candidate;
}

/** Sandbox schema built on the structural check above. */
const SandboxSchema = z.custom<Sandbox>(looksLikeSandbox, {
  message: 'Invalid Sandbox instance',
});

/**
 * Schema describing the options an analytics engineer agent is created with.
 * `sandbox` and `model` are optional; every other field is a required string.
 */
const AnalyticsEngineerAgentOptionsSchema = z.object({
  folder_structure: z.string().describe('The file structure of the dbt repository'),
  userId: z.string(),
  chatId: z.string(),
  dataSourceId: z.string(),
  organizationId: z.string(),
  messageId: z.string(),
  sandbox: SandboxSchema.optional(),
  model: z
    .custom<LanguageModelV2>()
    .optional()
    .describe('Custom language model to use (defaults to Sonnet4)'),
});

/**
 * Schema for the argument of the agent's `stream` function: the list of
 * conversation messages to send to the model.
 *
 * NOTE(review): the description text still says "docs agent" (legacy name);
 * it is a runtime string and is left unchanged here.
 */
const AnalyticsEngineerAgentStreamOptionsSchema = z.object({
  messages: z.array(z.custom<ModelMessage>()).describe('The messages to send to the docs agent'),
});

/**
 * Options accepted by `createAnalyticsEngineerAgent`: the fields inferred from
 * the options schema plus an optional `onToolEvent` callback, which is declared
 * here on the type only and is not part of the zod schema.
 */
export type AnalyticsEngineerAgentOptions = z.infer<typeof AnalyticsEngineerAgentOptionsSchema> & {
  onToolEvent?: ToolEventCallback;
};
/** Argument shape of the agent's `stream` function, inferred from its schema. */
export type AnalyticsEngineerAgentStreamOptions = z.infer<typeof AnalyticsEngineerAgentStreamOptionsSchema>;

// Extended type for passing to tools: the agent options with `sandbox` made required.
// NOTE(review): the "DocsAgent" prefix is the agent's legacy name; the type is exported,
// so it is not renamed here.
export type DocsAgentContextWithSandbox = AnalyticsEngineerAgentOptions & { sandbox: Sandbox };

/**
 * Creates an analytics engineer agent bound to the supplied options.
 *
 * The system message and every tool instance are built once here and reused by
 * each `stream` call on the returned object.
 *
 * @param analyticsEngineerAgentOptions - Agent configuration. `folder_structure`
 *   feeds the system prompt and is also handed to the file tools as
 *   `projectDirectory`; `messageId` and `onToolEvent` are forwarded to the tools;
 *   `model`, when set, replaces the default `Sonnet4`. The whole object is also
 *   passed to `streamText` as `experimental_context`.
 * @returns An object exposing `stream`.
 */
export function createAnalyticsEngineerAgent(analyticsEngineerAgentOptions: AnalyticsEngineerAgentOptions) {
  const { folder_structure: folderStructure, messageId, onToolEvent } = analyticsEngineerAgentOptions;

  const systemMessage = {
    role: 'system',
    content: getAnalyticsEngineerAgentSystemPrompt(folderStructure),
    providerOptions: DEFAULT_ANTHROPIC_OPTIONS,
  } as ModelMessage;

  // NOTE(review): `folder_structure` is described by the schema as the repository's
  // file structure, yet it is what the tools receive as `projectDirectory` — confirm
  // callers actually pass a directory path here.
  const fileToolContext = { messageId, projectDirectory: folderStructure };
  const fileToolContextWithEvents = { ...fileToolContext, onToolEvent };

  // Single source of truth for the tool set: given to `streamText` and used to
  // derive the tool names reported to the repair helper.
  const tools = {
    idleTool: createIdleTool({ onToolEvent }),
    grepTool: createGrepTool(fileToolContextWithEvents),
    writeFileTool: createWriteFileTool(fileToolContextWithEvents),
    // NOTE(review): the read-file tool is the only one created without `onToolEvent`;
    // kept that way to preserve behavior — confirm whether this is intentional.
    readFileTool: createReadFileTool(fileToolContext),
    bashTool: createBashTool(fileToolContextWithEvents),
    editFileTool: createEditFileTool(fileToolContextWithEvents),
    multiEditFileTool: createMultiEditFileTool(fileToolContextWithEvents),
    lsTool: createLsTool(fileToolContextWithEvents),
  };

  /**
   * Streams a model response for the given conversation.
   *
   * The system message is prepended to `messages`, a tool call is required on
   * every step (`toolChoice: 'required'`), and `STOP_CONDITIONS` is passed as
   * `stopWhen`. The call is wrapped with `wrapTraced`.
   *
   * @param options - Object holding `messages`, the conversation so far.
   * @returns Whatever `streamText` returns for this request.
   */
  async function stream({ messages }: AnalyticsEngineerAgentStreamOptions) {
    // Report the tools that are really registered. The previous hard-coded list
    // named tools this agent does not expose (e.g. `executeSql`, `webSearch`) and
    // omitted the file tools, so the repair helper was told about the wrong tool set.
    const agentContext: AgentContext = {
      agentName: ANALYST_ENGINEER_AGENT_NAME,
      availableTools: Object.keys(tools),
    };

    return wrapTraced(
      () =>
        streamText({
          // Read at call time so the default applies only when no model was supplied.
          model: analyticsEngineerAgentOptions.model ?? Sonnet4,
          providerOptions: DEFAULT_ANTHROPIC_OPTIONS,
          tools,
          messages: [systemMessage, ...messages],
          stopWhen: STOP_CONDITIONS,
          toolChoice: 'required',
          maxOutputTokens: 10000,
          temperature: 0,
          experimental_context: analyticsEngineerAgentOptions,
          experimental_repairToolCall: async (repairContext) => {
            return repairToolCall({
              toolCall: repairContext.toolCall,
              tools: repairContext.tools,
              error: repairContext.error,
              messages: repairContext.messages,
              // Only forward the optional fields when they are present.
              ...(repairContext.system && { system: repairContext.system }),
              ...(repairContext.inputSchema && { inputSchema: repairContext.inputSchema }),
              agentContext,
            });
          },
        }),
      {
        // NOTE(review): legacy trace name; left unchanged so existing traces keep
        // the same label.
        name: 'Docs Agent',
      }
    )();
  }

  return {
    stream,
  };
}
ok proxy with handler in cli working 2025-10-01 10:49:25 +08:00			`import type { LanguageModelV2 } from '@ai-sdk/provider';`
add in api key auth on proxy endpoint and pass it into the docs agent handler 2025-10-01 10:59:53 +08:00			`import type { Sandbox } from '@buster/sandbox';`
migration 2025-08-06 12:11:48 +08:00			`import { type ModelMessage, hasToolCall, stepCountIs, streamText } from 'ai';`
			`import { wrapTraced } from 'braintrust';`
			`import z from 'zod';`
routing for gateway 2025-09-03 11:21:33 +08:00			`import { DEFAULT_ANTHROPIC_OPTIONS } from '../../llm/providers/gateway';`
tons of cleanup 2025-08-08 22:03:22 +08:00			`import { Sonnet4 } from '../../llm/sonnet-4';`
moved over tools 2025-10-01 12:15:38 +08:00			`import { createIdleTool } from '../../tools';`
ls tool 2025-10-01 12:44:15 +08:00			`import { createEditFileTool, createLsTool, createMultiEditFileTool, createWriteFileTool } from '../../tools/file-tools';`
moved over tools 2025-10-01 12:15:38 +08:00			`import { createBashTool } from '../../tools/file-tools/bash-tool/bash-tool';`
			`import { createGrepTool } from '../../tools/file-tools/grep-tool/grep-tool';`
			`import { createReadFileTool } from '../../tools/file-tools/read-file-tool/read-file-tool';`
logic around reports, bug fixes, self healing, etc. 2025-08-21 00:22:35 +08:00			`import { type AgentContext, repairToolCall } from '../../utils/tool-call-repair';`
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`import { getDocsAgentSystemPrompt as getAnalyticsEngineerAgentSystemPrompt } from './get-analytics-engineer-agent-system-prompt';`
starting to piece together ui for tasks 2025-10-03 22:09:09 +08:00			`import type { ToolEventCallback } from './tool-events';`
refactor: rename bashExecute to executeBash for consistency - Updated the export name in index.ts and adjusted imports in the corresponding test file. - Modified the tool definition in bash-execute-tool.ts to reflect the new naming convention. 2025-07-24 00:55:03 +08:00
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`export const ANALYST_ENGINEER_AGENT_NAME = 'analyticsEngineerAgent';`
logic around reports, bug fixes, self healing, etc. 2025-08-21 00:22:35 +08:00
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`const STOP_CONDITIONS = [stepCountIs(100), hasToolCall('idleTool')];`
migration 2025-08-06 12:11:48 +08:00
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`const AnalyticsEngineerAgentOptionsSchema = z.object({`
migration 2025-08-06 12:11:48 +08:00			`folder_structure: z.string().describe('The file structure of the dbt repository'),`
Refactor Docs Agent to include additional context parameters and streamline SQL execution. Introduce user, chat, data source, organization, and optional message IDs in the DocsAgentOptions schema. Update createDocsAgent function to utilize the new context structure. Remove obsolete parseStreamingArgs function from execute-sql-docs-agent as AI SDK v5 handles streaming parsing internally. 2025-08-07 07:10:25 +08:00			`userId: z.string(),`
			`chatId: z.string(),`
			`dataSourceId: z.string(),`
			`organizationId: z.string(),`
tools updating properly 2025-08-16 05:24:05 +08:00			`messageId: z.string(),`
tons of changes 2025-08-08 06:09:45 +08:00			`sandbox: z`
			`.custom<Sandbox>(`
			`(val) => {`
			`return val && typeof val === 'object' && 'id' in val && 'fs' in val;`
			`},`
			`{ message: 'Invalid Sandbox instance' }`
			`)`
			`.optional(),`
add in api key auth on proxy endpoint and pass it into the docs agent handler 2025-10-01 10:59:53 +08:00			`model: z`
			`.custom<LanguageModelV2>()`
			`.optional()`
			`.describe('Custom language model to use (defaults to Sonnet4)'),`
migration 2025-08-06 12:11:48 +08:00			`});`

changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`const AnalyticsEngineerAgentStreamOptionsSchema = z.object({`
migration 2025-08-06 12:11:48 +08:00			`messages: z.array(z.custom<ModelMessage>()).describe('The messages to send to the docs agent'),`
refactor: rename bashExecute to executeBash for consistency - Updated the export name in index.ts and adjusted imports in the corresponding test file. - Modified the tool definition in bash-execute-tool.ts to reflect the new naming convention. 2025-07-24 00:55:03 +08:00			`});`
migration 2025-08-06 12:11:48 +08:00
starting to piece together ui for tasks 2025-10-03 22:09:09 +08:00			`export type AnalyticsEngineerAgentOptions = z.infer<typeof AnalyticsEngineerAgentOptionsSchema> & {`
			`onToolEvent?: ToolEventCallback;`
			`};`
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`export type AnalyticsEngineerAgentStreamOptions = z.infer<typeof AnalyticsEngineerAgentStreamOptionsSchema>;`
migration 2025-08-06 12:11:48 +08:00
ok going to make tools follow factory pattern and prepping to move chunk processor to be tool specific 2025-08-07 23:58:28 +08:00			`// Extended type for passing to tools (includes sandbox)`
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`export type DocsAgentContextWithSandbox = AnalyticsEngineerAgentOptions & { sandbox: Sandbox };`
ok going to make tools follow factory pattern and prepping to move chunk processor to be tool specific 2025-08-07 23:58:28 +08:00
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`export function createAnalyticsEngineerAgent(analyticsEngineerAgentOptions: AnalyticsEngineerAgentOptions) {`
migration 2025-08-06 12:11:48 +08:00			`const systemMessage = {`
			`role: 'system',`
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`content: getAnalyticsEngineerAgentSystemPrompt(analyticsEngineerAgentOptions.folder_structure),`
routing for gateway 2025-09-03 11:21:33 +08:00			`providerOptions: DEFAULT_ANTHROPIC_OPTIONS,`
migration 2025-08-06 12:11:48 +08:00			`} as ModelMessage;`

starting to piece together ui for tasks 2025-10-03 22:09:09 +08:00			`const idleTool = createIdleTool({`
			`onToolEvent: analyticsEngineerAgentOptions.onToolEvent,`
			`});`
move write file to single and to bun based with separate prompt 2025-10-01 11:39:29 +08:00			`const writeFileTool = createWriteFileTool({`
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`messageId: analyticsEngineerAgentOptions.messageId,`
			`projectDirectory: analyticsEngineerAgentOptions.folder_structure,`
write file message 2025-10-03 22:34:18 +08:00			`onToolEvent: analyticsEngineerAgentOptions.onToolEvent,`
move write file to single and to bun based with separate prompt 2025-10-01 11:39:29 +08:00			`});`
moved over tools 2025-10-01 12:15:38 +08:00			`const grepTool = createGrepTool({`
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`messageId: analyticsEngineerAgentOptions.messageId,`
			`projectDirectory: analyticsEngineerAgentOptions.folder_structure,`
starting to piece together ui for tasks 2025-10-03 22:09:09 +08:00			`onToolEvent: analyticsEngineerAgentOptions.onToolEvent,`
moved over tools 2025-10-01 12:15:38 +08:00			`});`
			`const readFileTool = createReadFileTool({`
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`messageId: analyticsEngineerAgentOptions.messageId,`
			`projectDirectory: analyticsEngineerAgentOptions.folder_structure,`
moved over tools 2025-10-01 12:15:38 +08:00			`});`
			`const bashTool = createBashTool({`
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`messageId: analyticsEngineerAgentOptions.messageId,`
			`projectDirectory: analyticsEngineerAgentOptions.folder_structure,`
starting to piece together ui for tasks 2025-10-03 22:09:09 +08:00			`onToolEvent: analyticsEngineerAgentOptions.onToolEvent,`
moved over tools 2025-10-01 12:15:38 +08:00			`});`
k tools are working properly there 2025-10-01 12:37:14 +08:00			`const editFileTool = createEditFileTool({`
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`messageId: analyticsEngineerAgentOptions.messageId,`
			`projectDirectory: analyticsEngineerAgentOptions.folder_structure,`
edit file tools 2025-10-03 23:07:20 +08:00			`onToolEvent: analyticsEngineerAgentOptions.onToolEvent,`
k tools are working properly there 2025-10-01 12:37:14 +08:00			`});`
			`const multiEditFileTool = createMultiEditFileTool({`
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`messageId: analyticsEngineerAgentOptions.messageId,`
			`projectDirectory: analyticsEngineerAgentOptions.folder_structure,`
edit file tools 2025-10-03 23:07:20 +08:00			`onToolEvent: analyticsEngineerAgentOptions.onToolEvent,`
k tools are working properly there 2025-10-01 12:37:14 +08:00			`});`
ls tool 2025-10-01 12:44:15 +08:00			`const lsTool = createLsTool({`
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`messageId: analyticsEngineerAgentOptions.messageId,`
			`projectDirectory: analyticsEngineerAgentOptions.folder_structure,`
starting to piece together ui for tasks 2025-10-03 22:09:09 +08:00			`onToolEvent: analyticsEngineerAgentOptions.onToolEvent,`
ls tool 2025-10-01 12:44:15 +08:00			`});`
Refactor Analyst and Think-and-Prep agents to enforce required messageId field in options schema. Update tool creation logic to streamline context handling and enhance error reporting. Introduce new execute-sql tool with improved state management and SQL execution capabilities, including delta processing and message updates. Remove deprecated execute-sql functionality and related tests. 2025-08-08 12:09:58 +08:00
refactor: introduce new planning tools for todo list and clarifications management - Added `createCheckOffTodoListTool` and `createUpdateClarificationsFileTool` to enhance planning capabilities. - Refactored existing tools to utilize the new planning tools, improving code organization and maintainability. - Updated tests to reflect changes in tool creation and execution, ensuring robust functionality. These changes streamline the management of todo lists and clarification questions, enhancing overall tool usability. 2025-08-12 00:28:26 +08:00			`// Create planning tools with simple context`
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`async function stream({ messages }: AnalyticsEngineerAgentStreamOptions) {`
logic around reports, bug fixes, self healing, etc. 2025-08-21 00:22:35 +08:00			`// Collect available tools dynamically based on what's enabled`
			`const availableTools: string[] = ['sequentialThinking'];`
			`availableTools.push('executeSql');`
			`availableTools.push('updateClarificationsFile', 'checkOffTodoList', 'idleTool', 'webSearch');`

			`const agentContext: AgentContext = {`
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`agentName: ANALYST_ENGINEER_AGENT_NAME,`
logic around reports, bug fixes, self healing, etc. 2025-08-21 00:22:35 +08:00			`availableTools,`
			`};`

migration 2025-08-06 12:11:48 +08:00			`return wrapTraced(`
			`() =>`
			`streamText({`
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`model: analyticsEngineerAgentOptions.model \|\| Sonnet4,`
routing for gateway 2025-09-03 11:21:33 +08:00			`providerOptions: DEFAULT_ANTHROPIC_OPTIONS,`
migration 2025-08-06 12:11:48 +08:00			`tools: {`
			`idleTool,`
moved over tools 2025-10-01 12:15:38 +08:00			`grepTool,`
move write file to single and to bun based with separate prompt 2025-10-01 11:39:29 +08:00			`writeFileTool,`
moved over tools 2025-10-01 12:15:38 +08:00			`readFileTool,`
			`bashTool,`
k tools are working properly there 2025-10-01 12:37:14 +08:00			`editFileTool,`
			`multiEditFileTool,`
ls tool 2025-10-01 12:44:15 +08:00			`lsTool,`
migration 2025-08-06 12:11:48 +08:00			`},`
			`messages: [systemMessage, ...messages],`
			`stopWhen: STOP_CONDITIONS,`
			`toolChoice: 'required',`
			`maxOutputTokens: 10000,`
			`temperature: 0,`
changed agent naming to analytics engineering agent 2025-10-03 06:45:08 +08:00			`experimental_context: analyticsEngineerAgentOptions,`
logic around reports, bug fixes, self healing, etc. 2025-08-21 00:22:35 +08:00			`experimental_repairToolCall: async (repairContext) => {`
			`return repairToolCall({`
			`toolCall: repairContext.toolCall,`
			`tools: repairContext.tools,`
			`error: repairContext.error,`
			`messages: repairContext.messages,`
			`...(repairContext.system && { system: repairContext.system }),`
			`...(repairContext.inputSchema && { inputSchema: repairContext.inputSchema }),`
			`agentContext,`
			`});`
			`},`
migration 2025-08-06 12:11:48 +08:00			`}),`
			`{`
			`name: 'Docs Agent',`
			`}`
			`)();`
			`}`

			`return {`
			`stream,`
			`};`
			`}`