diff --git a/vision_agent/tools/tool_types.py b/vision_agent/tools/tool_types.py index c575cec8..8ab55ffe 100644 --- a/vision_agent/tools/tool_types.py +++ b/vision_agent/tools/tool_types.py @@ -1,13 +1,13 @@ -from typing import List, Tuple +from typing import List, Tuple, Literal -from nptyping import UInt8, NDArray, Shape +from nptyping import UInt8, NDArray from pydantic import BaseModel, ConfigDict class BboxInput(BaseModel): model_config = ConfigDict(arbitrary_types_allowed=True) - image: NDArray[Shape["Height, Width, 3"], UInt8] + image: NDArray[Literal["Height, Width, 3"], UInt8] filename: str labels: List[str] bboxes: List[Tuple[int, int, int, int]] diff --git a/vision_agent/tools/tools.py b/vision_agent/tools/tools.py index 6e323b79..fc5a6d72 100644 --- a/vision_agent/tools/tools.py +++ b/vision_agent/tools/tools.py @@ -879,6 +879,7 @@ def generate_pose_image(image: np.ndarray) -> np.ndarray: data = { "image": image_b64, "tool": "generate_pose", + "function_name": "generate_pose_image", } answer = send_inference_request(data, "tools")