refactor: update action method return type to include Coordinate

danyalxahid-askui · danyalxahid-askui · commit cd4d4e82647b · 2025-07-24T21:33:13.000+02:00
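- Widened the return type annotation of the `__call__` method (the method that dispatches on its `action` argument) in `Computer20250124Tool` from `Image.Image | None` to `Image.Image | None | Coordinate`, so that the annotation also covers a `Coordinate` result. The remaining changes are formatting only and do not alter behavior: multi-line imports in `computer.py` and `image_utils.py` are rewrapped, the `scale_coordinates_with_padding` call in `_get_mouse_position_scaled` is split across lines, the bounds check in `scale_coordinates_with_padding` is collapsed onto one line, and stray blank lines are removed.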
diff --git a/src/askui/tools/computer.py b/src/askui/tools/computer.py
@@ -4,16 +4,20 @@
 from dataclasses import dataclass
 from typing import Annotated, Literal, TypedDict, cast, get_args
 
-from anthropic.types.beta import (BetaToolComputerUse20241022Param,
-                                  BetaToolComputerUse20250124Param)
+from anthropic.types.beta import (
+    BetaToolComputerUse20241022Param,
+    BetaToolComputerUse20250124Param,
+)
 from PIL import Image
 from pydantic import Field, validate_call
 from typing_extensions import Self, override
 
 from askui.tools.agent_os import AgentOs, Coordinate, ModifierKey, PcKey
-from askui.utils.image_utils import (scale_coordinates_back,
-                                     scale_coordinates_with_padding,
-                                     scale_image_with_padding)
+from askui.utils.image_utils import (
+    scale_coordinates_back,
+    scale_coordinates_with_padding,
+    scale_image_with_padding,
+)
 
 from ..models.shared.tools import InputSchema, Tool
 
@@ -325,11 +329,17 @@ def _screenshot(self) -> Image.Image:
         self._real_screen_height = screenshot.height
         return scale_image_with_padding(screenshot, self._width, self._height)
 
-
     def _get_mouse_position_scaled(self) -> Coordinate:
         mouse_position: Coordinate = self._agent_os.get_mouse_position()
         real_screen_width, real_screen_height = self._get_real_screen_resolution()
-        x, y = scale_coordinates_with_padding(mouse_position.x, mouse_position.y, real_screen_width, real_screen_height, self._width, self._height)
+        x, y = scale_coordinates_with_padding(
+            mouse_position.x,
+            mouse_position.y,
+            real_screen_width,
+            real_screen_height,
+            self._width,
+            self._height,
+        )
         return Coordinate(x=int(x), y=int(y))
 
 
@@ -433,7 +443,7 @@ def __call__(  # noqa: C901
         scroll_amount: Annotated[int, Field(ge=0)] | None = None,
         duration: Annotated[float, Field(ge=0.0, le=100.0)] | None = None,
         key: str | None = None,  # maybe not all keys supported
-    ) -> Image.Image | None:
+    ) -> Image.Image | None | Coordinate:
         match action:
             case "hold_key":
                 self._hold_key(keystroke=text, duration=duration)  # type: ignore[arg-type]
diff --git a/src/askui/utils/image_utils.py b/src/askui/utils/image_utils.py
@@ -7,9 +7,8 @@
 from pathlib import Path
 from typing import Any, Literal, Tuple, Union
 
-from PIL import Image
+from PIL import Image, ImageDraw, ImageOps, UnidentifiedImageError
 from PIL import Image as PILImage
-from PIL import ImageDraw, ImageOps, UnidentifiedImageError
 from pydantic import ConfigDict, RootModel, field_validator
 
 # Regex to capture any kind of valid base64 data url (with optional media type and ;base64)
@@ -233,16 +232,10 @@ def scale_coordinates_with_padding(
     scaled_x = x * scale_factor + pad_left
     scaled_y = y * scale_factor + pad_top
 
-    if (
-        scaled_x < 0
-        or scaled_y < 0
-        or scaled_x > max_width
-        or scaled_y > max_height
-    ):
+    if scaled_x < 0 or scaled_y < 0 or scaled_x > max_width or scaled_y > max_height:
         error_msg = "Coordinates are outside the padded image area"
         raise ValueError(error_msg)
 
-
     return scaled_x, scaled_y