screen cap tool in readme

cagostino · cagostino · commit 28ecb5d210bc · 2025-03-20T01:20:09.000-04:00
diff --git a/README.md b/README.md
@@ -1337,40 +1337,33 @@ Tools are defined as YAMLs with `.tool` extension within the npc_team/tools dire
 Here is an example of a tool file:
 ```yaml
 tool_name: "screen_capture_analysis_tool"
+description: Captures the whole screen and sends the image for analysis
 inputs:
   - "prompt"
-preprocess:
+steps:
   - engine: "python"
     code: |
       # Capture the screen
       import pyautogui
       import datetime
       import os
       from PIL import Image
-      from npcsh.image import analyze_image_base
-
-      # Generate filename
-      filename = f"screenshot_{datetime.datetime.now().strftime('%Y%m%d_%H%M%S')}.png"
-      screenshot = pyautogui.screenshot()
-      screenshot.save(filename)
-      print(f"Screenshot saved as {filename}")
-
-      # Load image
-      image = Image.open(filename)
-
-      # Full file path
-      file_path = os.path.abspath('./'+filename)
-      # Analyze the image
-
-      llm_output = analyze_image_base(inputs['prompt']+ '\n\n attached is a screenshot of my screen currently.', file_path, filename, npc=npc)
-prompt:
-  engine: "natural"
-  code: ""
-postprocess:
-  - engine: "natural"
-    code: |
-      Screenshot captured and saved as {{ filename }}.
-      Analysis Result: {{ llm_output }}
+      import time
+      from npcsh.image import analyze_image_base, capture_screenshot
+
+      out = capture_screenshot(npc = npc, full = True)
+      # NOTE(review): '{{prompt}}' sits inside a single-quoted Python literal; a prompt containing ' may break this code - confirm how the template is rendered
+      llm_response = analyze_image_base( '{{prompt}}' + "\n\nAttached is a screenshot of my screen currently. Please use this to evaluate the situation. If the user asked for you to explain what's on their screen or something similar, they are referring to the details contained within the attached image. You do not need to actually view their screen. You do not need to mention that you cannot view or interpret images directly. You only need to answer the user's request based on the attached screenshot!",
+                                        out['file_path'],
+                                        out['filename'],
+                                        npc=npc,
+                                        **out['model_kwargs'])
+      # Normalize the result: keep the 'response' text when a dict comes back, otherwise use a fallback message
+      if isinstance(llm_response, dict):
+          llm_response = llm_response.get('response', 'No response from image analysis')
+      else:
+          llm_response = 'No response from image analysis'
+
 ```