Improve analyze description for multiple windows

2026-04-27 15:07:41 +00:00 · 2025-06-08 04:47:52 +01:00 · 2025-06-08 04:47:52 +01:00 · b3ec918363
commit b3ec918363
parent 06cf4f144e
2 changed files with 148 additions and 3 deletions
--- a/src/tools/image.ts
+++ b/src/tools/image.ts
@ -92,6 +92,26 @@ export async function imageToolHandler(
      analysisAttempted = true;
      const analysisResults: Array<{ label: string; text: string }> = [];
      // Helper function to generate descriptive labels for analysis
      const getAnalysisLabel = (savedFile: SavedFile, isMultipleFiles: boolean): string => {
        if (!isMultipleFiles) {
          // For single files, use the item_label (app name or screen description)
          return savedFile.item_label || "Unknown";
        }
        // For multiple files, prefer window_title if available
        if (savedFile.window_title) {
          return `"${savedFile.window_title}"`;
        }
        // Fall back to item_label with window index if available
        if (savedFile.window_index !== undefined) {
          return `${savedFile.item_label || "Unknown"} (Window ${savedFile.window_index + 1})`;
        }
        return savedFile.item_label || "Unknown";
      };
      const configuredProviders = parseAIProviders(
        process.env.PEEKABOO_AI_PROVIDERS || "",
      );
@ -101,7 +121,10 @@ export async function imageToolHandler(
        logger.warn(analysisText);
      } else {
        // Iterate through all saved files for analysis
        const isMultipleFiles = captureData.saved_files.length > 1;
        for (const savedFile of captureData.saved_files) {
          const analysisLabel = getAnalysisLabel(savedFile, isMultipleFiles);
          try {
            const imageBase64 = await readImageAsBase64(savedFile.path);
            logger.debug({ path: savedFile.path }, "Image read successfully for analysis.");
@ -115,12 +138,12 @@ export async function imageToolHandler(
            if (analysisResult.error) {
              analysisResults.push({
-                label: savedFile.item_label || "Unknown",
+                label: analysisLabel,
                text: analysisResult.error,
              });
            } else {
              analysisResults.push({
-                label: savedFile.item_label || "Unknown",
+                label: analysisLabel,
                text: analysisResult.analysisText || "",
              });
              modelUsed = analysisResult.modelUsed;
@ -133,7 +156,7 @@ export async function imageToolHandler(
              "Failed to read captured image for analysis",
            );
            analysisResults.push({
-              label: savedFile.item_label || "Unknown",
+              label: analysisLabel,
              text: `Analysis skipped: Failed to read captured image at ${savedFile.path}. Error: ${readError instanceof Error ? readError.message : "Unknown read error"}`,
            });
          }
--- a/tests/unit/tools/image.test.ts
+++ b/tests/unit/tools/image.test.ts
@ -741,6 +741,128 @@ describe("Image Tool", () => {
      // Verify that the temporary directory is no longer cleaned up (files preserved)
      expect(mockFsRm).not.toHaveBeenCalled();
    });
    it("should use window titles for analysis labels when capturing multiple windows", async () => {
      // Mock resolveImagePath to return a temporary directory path
      mockResolveImagePath.mockResolvedValue({
        effectivePath: MOCK_TEMP_IMAGE_DIR,
        tempDirUsed: MOCK_TEMP_IMAGE_DIR,
      });
      // Mock executeSwiftCli with two saved files that have window titles
      const mockFile1: SavedFile = {
        path: "/tmp/peekaboo-img-XXXXXX/chrome_window1.png",
        mime_type: "image/png",
        item_label: "Google Chrome",
        window_title: "MCP Inspector",
        window_index: 0,
        window_id: 123,
      };
      const mockFile2: SavedFile = {
        path: "/tmp/peekaboo-img-XXXXXX/chrome_window2.png", 
        mime_type: "image/png",
        item_label: "Google Chrome",
        window_title: "(9) Home / X",
        window_index: 1,
        window_id: 124,
      };
      const mockResponse = {
        success: true,
        data: { saved_files: [mockFile1, mockFile2] },
        messages: ["Captured 2 Chrome windows"],
      };
      mockExecuteSwiftCli.mockResolvedValue(mockResponse);
      // Mock readImageAsBase64 to return different base64 strings
      mockReadImageAsBase64
        .mockResolvedValueOnce("base64dataforwindow1")
        .mockResolvedValueOnce("base64dataforwindow2");
      // Mock performAutomaticAnalysis to return different analysis for each call
      mockPerformAutomaticAnalysis
        .mockResolvedValueOnce({
          analysisText: "This shows the MCP Inspector interface.",
          modelUsed: MOCK_MODEL_USED,
        })
        .mockResolvedValueOnce({
          analysisText: "This shows the X (Twitter) home page.",
          modelUsed: MOCK_MODEL_USED,
        });
      // Call imageToolHandler with a question
      const result = await imageToolHandler(
        { question: "What is shown in each window?" },
        mockContext,
      );
      // Verify the final analysis_text uses window titles instead of app names
      expect(result.analysis_text).toBe(
        'Analysis for "MCP Inspector":\nThis shows the MCP Inspector interface.\n\nAnalysis for "(9) Home / X":\nThis shows the X (Twitter) home page.'
      );
      // Verify that the temporary directory is no longer cleaned up (files preserved)
      expect(mockFsRm).not.toHaveBeenCalled();
    });
    it("should fallback to window index when no window title is available", async () => {
      // Mock resolveImagePath to return a temporary directory path
      mockResolveImagePath.mockResolvedValue({
        effectivePath: MOCK_TEMP_IMAGE_DIR,
        tempDirUsed: MOCK_TEMP_IMAGE_DIR,
      });
      // Mock executeSwiftCli with two saved files without window titles
      const mockFile1: SavedFile = {
        path: "/tmp/peekaboo-img-XXXXXX/app_window1.png",
        mime_type: "image/png",
        item_label: "Some App",
        window_index: 0,
        window_id: 123,
      };
      const mockFile2: SavedFile = {
        path: "/tmp/peekaboo-img-XXXXXX/app_window2.png", 
        mime_type: "image/png",
        item_label: "Some App",
        window_index: 1,
        window_id: 124,
      };
      const mockResponse = {
        success: true,
        data: { saved_files: [mockFile1, mockFile2] },
        messages: ["Captured 2 app windows"],
      };
      mockExecuteSwiftCli.mockResolvedValue(mockResponse);
      // Mock readImageAsBase64 to return different base64 strings
      mockReadImageAsBase64
        .mockResolvedValueOnce("base64dataforwindow1")
        .mockResolvedValueOnce("base64dataforwindow2");
      // Mock performAutomaticAnalysis to return different analysis for each call
      mockPerformAutomaticAnalysis
        .mockResolvedValueOnce({
          analysisText: "Analysis for first window.",
          modelUsed: MOCK_MODEL_USED,
        })
        .mockResolvedValueOnce({
          analysisText: "Analysis for second window.",
          modelUsed: MOCK_MODEL_USED,
        });
      // Call imageToolHandler with a question
      const result = await imageToolHandler(
        { question: "What is shown in each window?" },
        mockContext,
      );
      // Verify the final analysis_text uses window index fallback
      expect(result.analysis_text).toBe(
        "Analysis for Some App (Window 1):\nAnalysis for first window.\n\nAnalysis for Some App (Window 2):\nAnalysis for second window."
      );
      // Verify that the temporary directory is no longer cleaned up (files preserved)
      expect(mockFsRm).not.toHaveBeenCalled();
    });
  });
  describe("buildSwiftCliArgs", () => {