fix: Align mostRecentFile selection with response message files

Ensures the mostRecentFile saved to chat matches what users see in response messages. Reports take priority (already displayed), followed by first extracted file. Co-Authored-By: Dallin Miner <dallin@buster.so>
2025-09-19 15:41:07 -06:00 · 2025-09-19 15:41:07 -06:00 · 2673805cd7
parent 0aaa53c685
commit 2673805cd7
3 changed files with 690 additions and 6 deletions
--- a/packages/ai/src/tools/communication-tools/done-tool/done-tool-start.test.ts
+++ b/packages/ai/src/tools/communication-tools/done-tool/done-tool-start.test.ts
@ -0,0 +1,668 @@
+import { randomUUID } from 'node:crypto';
+import { updateChat, updateMessage, updateMessageEntries } from '@buster/database/queries';
+import type { ModelMessage, ToolCallOptions } from 'ai';
+import { beforeEach, describe, expect, it, vi } from 'vitest';
+import { CREATE_DASHBOARDS_TOOL_NAME } from '../../visualization-tools/dashboards/create-dashboards-tool/create-dashboards-tool';
+import { CREATE_METRICS_TOOL_NAME } from '../../visualization-tools/metrics/create-metrics-tool/create-metrics-tool';
+import { CREATE_REPORTS_TOOL_NAME } from '../../visualization-tools/reports/create-reports-tool/create-reports-tool';
+import { MODIFY_REPORTS_TOOL_NAME } from '../../visualization-tools/reports/modify-reports-tool/modify-reports-tool';
+import type { DoneToolContext, DoneToolState } from './done-tool';
+import { createDoneToolStart } from './done-tool-start';
+
+vi.mock('@buster/database/queries', () => ({
+  updateChat: vi.fn(),
+  updateMessage: vi.fn(),
+  updateMessageEntries: vi.fn(),
+}));
+
+describe('done-tool-start', () => {
+  const mockContext: DoneToolContext = {
+    chatId: 'chat-123',
+    messageId: 'message-456',
+    workflowStartTime: Date.now() - 5000,
+  };
+
+  const mockDoneToolState: DoneToolState = {
+    toolCallId: undefined,
+    args: undefined,
+    finalResponse: undefined,
+  };
+
+  beforeEach(() => {
+    vi.clearAllMocks();
+  });
+
+  describe('mostRecentFile selection', () => {
+    it('should prioritize report files when present', async () => {
+      const reportId = randomUUID();
+      const metricId = randomUUID();
+      const dashboardId = randomUUID();
+
+      const mockMessages: ModelMessage[] = [
+        {
+          role: 'assistant',
+          content: [
+            {
+              type: 'tool-call',
+              toolName: CREATE_REPORTS_TOOL_NAME,
+              toolCallId: 'report-call',
+              input: {
+                files: [{ yml_content: 'report content with metrics' }],
+              },
+            },
+          ],
+        },
+        {
+          role: 'tool',
+          content: [
+            {
+              type: 'tool-result',
+              toolName: CREATE_REPORTS_TOOL_NAME,
+              toolCallId: 'report-call',
+              output: {
+                type: 'json',
+                value: JSON.stringify({
+                  files: [
+                    {
+                      id: reportId,
+                      name: 'Analysis Report',
+                      version_number: 1,
+                    },
+                  ],
+                }),
+              },
+            },
+          ],
+        },
+        {
+          role: 'tool',
+          content: [
+            {
+              type: 'tool-result',
+              toolName: CREATE_METRICS_TOOL_NAME,
+              toolCallId: 'metric-call',
+              output: {
+                type: 'json',
+                value: JSON.stringify({
+                  files: [
+                    {
+                      id: metricId,
+                      name: 'Revenue Metric',
+                      version_number: 1,
+                    },
+                  ],
+                }),
+              },
+            },
+          ],
+        },
+        {
+          role: 'tool',
+          content: [
+            {
+              type: 'tool-result',
+              toolName: CREATE_DASHBOARDS_TOOL_NAME,
+              toolCallId: 'dashboard-call',
+              output: {
+                type: 'json',
+                value: JSON.stringify({
+                  files: [
+                    {
+                      id: dashboardId,
+                      name: 'Sales Dashboard',
+                      version_number: 1,
+                    },
+                  ],
+                }),
+              },
+            },
+          ],
+        },
+      ];
+
+      const doneToolStart = createDoneToolStart(mockContext, mockDoneToolState);
+      await doneToolStart({
+        toolCallId: 'done-call',
+        messages: mockMessages,
+      } as ToolCallOptions);
+
+      expect(updateChat).toHaveBeenCalledWith('chat-123', {
+        mostRecentFileId: reportId,
+        mostRecentFileType: 'report_file',
+        mostRecentVersionNumber: 1,
+      });
+    });
+
+    it('should use first extracted file when no reports exist', async () => {
+      const metricId1 = randomUUID();
+      const metricId2 = randomUUID();
+      const dashboardId = randomUUID();
+
+      const mockMessages: ModelMessage[] = [
+        {
+          role: 'tool',
+          content: [
+            {
+              type: 'tool-result',
+              toolName: CREATE_METRICS_TOOL_NAME,
+              toolCallId: 'metric-call-1',
+              output: {
+                type: 'json',
+                value: JSON.stringify({
+                  files: [
+                    {
+                      id: metricId1,
+                      name: 'First Metric',
+                      version_number: 1,
+                    },
+                  ],
+                }),
+              },
+            },
+          ],
+        },
+        {
+          role: 'tool',
+          content: [
+            {
+              type: 'tool-result',
+              toolName: CREATE_METRICS_TOOL_NAME,
+              toolCallId: 'metric-call-2',
+              output: {
+                type: 'json',
+                value: JSON.stringify({
+                  files: [
+                    {
+                      id: metricId2,
+                      name: 'Second Metric',
+                      version_number: 1,
+                    },
+                  ],
+                }),
+              },
+            },
+          ],
+        },
+        {
+          role: 'tool',
+          content: [
+            {
+              type: 'tool-result',
+              toolName: CREATE_DASHBOARDS_TOOL_NAME,
+              toolCallId: 'dashboard-call',
+              output: {
+                type: 'json',
+                value: JSON.stringify({
+                  files: [
+                    {
+                      id: dashboardId,
+                      name: 'Dashboard',
+                      version_number: 1,
+                    },
+                  ],
+                }),
+              },
+            },
+          ],
+        },
+      ];
+
+      const doneToolStart = createDoneToolStart(mockContext, mockDoneToolState);
+      await doneToolStart({
+        toolCallId: 'done-call',
+        messages: mockMessages,
+      } as ToolCallOptions);
+
+      // Should select the first metric (first in extractedFiles)
+      expect(updateChat).toHaveBeenCalledWith('chat-123', {
+        mostRecentFileId: metricId1,
+        mostRecentFileType: 'metric_file',
+        mostRecentVersionNumber: 1,
+      });
+    });
+
+    it('should handle report with absorbed metrics correctly', async () => {
+      const reportId = randomUUID();
+      const absorbedMetricId = randomUUID();
+      const standaloneMetricId = randomUUID();
+
+      const mockMessages: ModelMessage[] = [
+        {
+          role: 'tool',
+          content: [
+            {
+              type: 'tool-result',
+              toolName: CREATE_METRICS_TOOL_NAME,
+              toolCallId: 'metrics-call',
+              output: {
+                type: 'json',
+                value: JSON.stringify({
+                  files: [
+                    {
+                      id: absorbedMetricId,
+                      name: 'Absorbed Metric',
+                      version_number: 1,
+                    },
+                    {
+                      id: standaloneMetricId,
+                      name: 'Standalone Metric',
+                      version_number: 1,
+                    },
+                  ],
+                }),
+              },
+            },
+          ],
+        },
+        {
+          role: 'tool',
+          content: [
+            {
+              type: 'tool-result',
+              toolName: MODIFY_REPORTS_TOOL_NAME,
+              toolCallId: 'report-call',
+              output: {
+                type: 'json',
+                value: JSON.stringify({
+                  file: {
+                    id: reportId,
+                    name: 'Report with Metrics',
+                    version_number: 1,
+                    content: `<metric metricId="${absorbedMetricId}" />`,
+                  },
+                }),
+              },
+            },
+          ],
+        },
+      ];
+
+      const doneToolStart = createDoneToolStart(mockContext, mockDoneToolState);
+      await doneToolStart({
+        toolCallId: 'done-call',
+        messages: mockMessages,
+      } as ToolCallOptions);
+
+      // Report should be selected as mostRecentFile
+      expect(updateChat).toHaveBeenCalledWith('chat-123', {
+        mostRecentFileId: reportId,
+        mostRecentFileType: 'report_file',
+        mostRecentVersionNumber: 1,
+      });
+
+      // Verify that only the standalone metric was added as a response message
+      expect(updateMessageEntries).toHaveBeenCalledWith(
+        expect.objectContaining({
+          messageId: 'message-456',
+          responseMessages: expect.arrayContaining([
+            expect.objectContaining({
+              id: standaloneMetricId,
+              file_name: 'Standalone Metric',
+              file_type: 'metric_file',
+            }),
+          ]),
+        })
+      );
+
+      // Absorbed metric should NOT be in response messages
+      const calls = (updateMessageEntries as any).mock.calls;
+      const responseMessageCalls = calls.filter((call: any) => call[0].responseMessages);
+      for (const call of responseMessageCalls) {
+        const responseMessages = call[0].responseMessages || [];
+        expect(responseMessages.find((msg: any) => msg.id === absorbedMetricId)).toBeUndefined();
+      }
+    });
+
+    it('should use first metric when multiple metrics are created', async () => {
+      const metricId1 = randomUUID();
+      const metricId2 = randomUUID();
+      const metricId3 = randomUUID();
+
+      const mockMessages: ModelMessage[] = [
+        {
+          role: 'tool',
+          content: [
+            {
+              type: 'tool-result',
+              toolName: CREATE_METRICS_TOOL_NAME,
+              toolCallId: 'metrics-call',
+              output: {
+                type: 'json',
+                value: JSON.stringify({
+                  files: [
+                    {
+                      id: metricId1,
+                      name: 'Metric 1',
+                      version_number: 1,
+                    },
+                    {
+                      id: metricId2,
+                      name: 'Metric 2',
+                      version_number: 1,
+                    },
+                    {
+                      id: metricId3,
+                      name: 'Metric 3',
+                      version_number: 1,
+                    },
+                  ],
+                }),
+              },
+            },
+          ],
+        },
+      ];
+
+      const doneToolStart = createDoneToolStart(mockContext, mockDoneToolState);
+      await doneToolStart({
+        toolCallId: 'done-call',
+        messages: mockMessages,
+      } as ToolCallOptions);
+
+      // Should select the first metric
+      expect(updateChat).toHaveBeenCalledWith('chat-123', {
+        mostRecentFileId: metricId1,
+        mostRecentFileType: 'metric_file',
+        mostRecentVersionNumber: 1,
+      });
+    });
+
+    it('should use first dashboard when multiple dashboards are created', async () => {
+      const dashboardId1 = randomUUID();
+      const dashboardId2 = randomUUID();
+
+      const mockMessages: ModelMessage[] = [
+        {
+          role: 'tool',
+          content: [
+            {
+              type: 'tool-result',
+              toolName: CREATE_DASHBOARDS_TOOL_NAME,
+              toolCallId: 'dashboards-call',
+              output: {
+                type: 'json',
+                value: JSON.stringify({
+                  files: [
+                    {
+                      id: dashboardId1,
+                      name: 'Dashboard 1',
+                      version_number: 1,
+                    },
+                    {
+                      id: dashboardId2,
+                      name: 'Dashboard 2',
+                      version_number: 1,
+                    },
+                  ],
+                }),
+              },
+            },
+          ],
+        },
+      ];
+
+      const doneToolStart = createDoneToolStart(mockContext, mockDoneToolState);
+      await doneToolStart({
+        toolCallId: 'done-call',
+        messages: mockMessages,
+      } as ToolCallOptions);
+
+      // Should select the first dashboard
+      expect(updateChat).toHaveBeenCalledWith('chat-123', {
+        mostRecentFileId: dashboardId1,
+        mostRecentFileType: 'dashboard_file',
+        mostRecentVersionNumber: 1,
+      });
+    });
+
+    it('should handle mixed metrics and dashboards correctly', async () => {
+      const metricId = randomUUID();
+      const dashboardId = randomUUID();
+
+      const mockMessages: ModelMessage[] = [
+        // Dashboard created first in message order
+        {
+          role: 'tool',
+          content: [
+            {
+              type: 'tool-result',
+              toolName: CREATE_DASHBOARDS_TOOL_NAME,
+              toolCallId: 'dashboard-call',
+              output: {
+                type: 'json',
+                value: JSON.stringify({
+                  files: [
+                    {
+                      id: dashboardId,
+                      name: 'Dashboard',
+                      version_number: 1,
+                    },
+                  ],
+                }),
+              },
+            },
+          ],
+        },
+        // Metric created second
+        {
+          role: 'tool',
+          content: [
+            {
+              type: 'tool-result',
+              toolName: CREATE_METRICS_TOOL_NAME,
+              toolCallId: 'metric-call',
+              output: {
+                type: 'json',
+                value: JSON.stringify({
+                  files: [
+                    {
+                      id: metricId,
+                      name: 'Metric',
+                      version_number: 1,
+                    },
+                  ],
+                }),
+              },
+            },
+          ],
+        },
+      ];
+
+      const doneToolStart = createDoneToolStart(mockContext, mockDoneToolState);
+      await doneToolStart({
+        toolCallId: 'done-call',
+        messages: mockMessages,
+      } as ToolCallOptions);
+
+      // Should select the dashboard (first in extractedFiles)
+      expect(updateChat).toHaveBeenCalledWith('chat-123', {
+        mostRecentFileId: dashboardId,
+        mostRecentFileType: 'dashboard_file',
+        mostRecentVersionNumber: 1,
+      });
+    });
+
+    it('should handle empty file lists gracefully', async () => {
+      const doneToolStart = createDoneToolStart(mockContext, mockDoneToolState);
+      await doneToolStart({
+        toolCallId: 'done-call',
+        messages: [],
+      } as ToolCallOptions);
+
+      // Should not call updateChat when no files exist
+      expect(updateChat).not.toHaveBeenCalled();
+    });
+
+    it('should handle only report files that are filtered out', async () => {
+      const reportId = randomUUID();
+
+      const mockMessages: ModelMessage[] = [
+        {
+          role: 'assistant',
+          content: [
+            {
+              type: 'tool-call',
+              toolName: CREATE_REPORTS_TOOL_NAME,
+              toolCallId: 'report-call',
+              input: {
+                files: [{ yml_content: 'simple report without metrics' }],
+              },
+            },
+          ],
+        },
+        {
+          role: 'tool',
+          content: [
+            {
+              type: 'tool-result',
+              toolName: CREATE_REPORTS_TOOL_NAME,
+              toolCallId: 'report-call',
+              output: {
+                type: 'json',
+                value: JSON.stringify({
+                  files: [
+                    {
+                      id: reportId,
+                      name: 'Simple Report',
+                      version_number: 1,
+                    },
+                  ],
+                }),
+              },
+            },
+          ],
+        },
+      ];
+
+      const doneToolStart = createDoneToolStart(mockContext, mockDoneToolState);
+      await doneToolStart({
+        toolCallId: 'done-call',
+        messages: mockMessages,
+      } as ToolCallOptions);
+
+      // Report should still be selected as mostRecentFile
+      expect(updateChat).toHaveBeenCalledWith('chat-123', {
+        mostRecentFileId: reportId,
+        mostRecentFileType: 'report_file',
+        mostRecentVersionNumber: 1,
+      });
+    });
+
+    it('should handle dashboards with embedded metrics correctly', async () => {
+      const dashboardId = randomUUID();
+      const embeddedMetricId = randomUUID();
+      const standaloneMetricId = randomUUID();
+
+      const mockMessages: ModelMessage[] = [
+        {
+          role: 'tool',
+          content: [
+            {
+              type: 'tool-result',
+              toolName: CREATE_METRICS_TOOL_NAME,
+              toolCallId: 'metrics-call',
+              output: {
+                type: 'json',
+                value: JSON.stringify({
+                  files: [
+                    {
+                      id: embeddedMetricId,
+                      name: 'Embedded Metric',
+                      version_number: 1,
+                    },
+                    {
+                      id: standaloneMetricId,
+                      name: 'Standalone Metric',
+                      version_number: 1,
+                    },
+                  ],
+                }),
+              },
+            },
+          ],
+        },
+        {
+          role: 'tool',
+          content: [
+            {
+              type: 'tool-result',
+              toolName: CREATE_DASHBOARDS_TOOL_NAME,
+              toolCallId: 'dashboard-call',
+              output: {
+                type: 'json',
+                value: JSON.stringify({
+                  files: [
+                    {
+                      id: dashboardId,
+                      name: 'Dashboard with Metrics',
+                      version_number: 1,
+                      metric_ids: [embeddedMetricId],
+                    },
+                  ],
+                }),
+              },
+            },
+          ],
+        },
+      ];
+
+      const doneToolStart = createDoneToolStart(mockContext, mockDoneToolState);
+      await doneToolStart({
+        toolCallId: 'done-call',
+        messages: mockMessages,
+      } as ToolCallOptions);
+
+      // Should select the standalone metric (first in extractedFiles after filtering)
+      expect(updateChat).toHaveBeenCalledWith('chat-123', {
+        mostRecentFileId: standaloneMetricId,
+        mostRecentFileType: 'metric_file',
+        mostRecentVersionNumber: 1,
+      });
+    });
+
+    it('should handle context with empty chatId', async () => {
+      const contextWithEmptyChatId: DoneToolContext = {
+        messageId: mockContext.messageId,
+        chatId: '', // Empty string to simulate missing/invalid chatId
+        workflowStartTime: mockContext.workflowStartTime,
+      };
+
+      const metricId = randomUUID();
+      const mockMessages: ModelMessage[] = [
+        {
+          role: 'tool',
+          content: [
+            {
+              type: 'tool-result',
+              toolName: CREATE_METRICS_TOOL_NAME,
+              toolCallId: 'metric-call',
+              output: {
+                type: 'json',
+                value: JSON.stringify({
+                  files: [
+                    {
+                      id: metricId,
+                      name: 'Test Metric',
+                      version_number: 1,
+                    },
+                  ],
+                }),
+              },
+            },
+          ],
+        },
+      ];
+
+      const doneToolStart = createDoneToolStart(contextWithEmptyChatId, mockDoneToolState);
+      await doneToolStart({
+        toolCallId: 'done-call',
+        messages: mockMessages,
+      } as ToolCallOptions);
+
+      // Should not call updateChat when chatId is missing
+      expect(updateChat).not.toHaveBeenCalled();
+      // But should still update message entries
+      expect(updateMessageEntries).toHaveBeenCalled();
+    });
+  });
+});
--- a/packages/ai/src/tools/communication-tools/done-tool/done-tool-start.ts
+++ b/packages/ai/src/tools/communication-tools/done-tool/done-tool-start.ts
@ -4,6 +4,7 @@ import type { UpdateMessageEntriesParams } from '../../../../../database/src/que
 import { createRawToolResultEntry } from '../../shared/create-raw-llm-tool-result-entry';
 import { DONE_TOOL_NAME, type DoneToolContext, type DoneToolState } from './done-tool';
 import {
+  type ExtractedFile,
  createFileResponseMessages,
  extractAllFilesForChatUpdate,
  extractFilesFromToolCalls,
@ -68,12 +69,25 @@ export function createDoneToolStart(context: DoneToolContext, doneToolState: Don
        }
      }

-      // Update the chat with the most recent file using the full set that includes reports
-      // Do not rely on the filtered response list since it excludes report files
+      // Update the chat with the most recent file
+      // Priority: Reports (already in responses) > First extracted file > Any file
      if (context.chatId && allFilesForChatUpdate.length > 0) {
-        const mostRecentFile =
-          allFilesForChatUpdate.find((f) => f.fileType === 'report_file') ||
-          allFilesForChatUpdate[0];
+        let mostRecentFile: ExtractedFile | undefined;
+
+        // Priority 1: Report files (they're already in response messages)
+        const reportFile = allFilesForChatUpdate.find((f) => f.fileType === 'report_file');
+        if (reportFile) {
+          mostRecentFile = reportFile;
+        }
+        // Priority 2: First file from extractedFiles (metrics/dashboards being added as responses)
+        else if (extractedFiles.length > 0) {
+          mostRecentFile = extractedFiles[0];
+        }
+        // Priority 3: Fallback to any file from allFilesForChatUpdate
+        else {
+          mostRecentFile = allFilesForChatUpdate[0];
+        }
+
        if (mostRecentFile) {
          console.info('[done-tool-start] Updating chat with most recent file', {
            chatId: context.chatId,
@ -81,6 +95,8 @@ export function createDoneToolStart(context: DoneToolContext, doneToolState: Don
            fileType: mostRecentFile.fileType,
            fileName: mostRecentFile.fileName,
            versionNumber: mostRecentFile.versionNumber,
+            wasFromExtracted: extractedFiles.some((f) => f.id === mostRecentFile.id),
+            wasReport: mostRecentFile.fileType === 'report_file',
          });

          try {
--- a/packages/ai/src/tools/communication-tools/done-tool/helpers/done-tool-file-selection.ts
+++ b/packages/ai/src/tools/communication-tools/done-tool/helpers/done-tool-file-selection.ts
@ -47,7 +47,7 @@ interface ToolFileInfo {
 }

 // File tracking type
-interface ExtractedFile {
+export interface ExtractedFile {
  id: string;
  fileType: 'metric_file' | 'dashboard_file' | 'report_file';
  fileName: string;