diff --git a/vision_agent/tools/__init__.py b/vision_agent/tools/__init__.py index 43460fbd..90858569 100644 --- a/vision_agent/tools/__init__.py +++ b/vision_agent/tools/__init__.py @@ -16,6 +16,8 @@ clip, closest_box_distance, closest_mask_distance, + countgd_counting, + countgd_example_based_counting, depth_anything_v2, detr_segmentation, dpt_hybrid_midas, @@ -30,6 +32,8 @@ generate_soft_edge_image, get_tool_documentation, git_vqa_v2, + gpt4o_image_vqa, + gpt4o_video_vqa, grounding_dino, grounding_sam, ixc25_image_vqa, @@ -37,13 +41,11 @@ load_image, loca_visual_prompt_counting, loca_zero_shot_counting, - countgd_counting, - countgd_example_based_counting, ocr, overlay_bounding_boxes, + overlay_counting_results, overlay_heat_map, overlay_segmentation_masks, - overlay_counting_results, owl_v2, save_image, save_json, diff --git a/vision_agent/tools/tool_utils.py b/vision_agent/tools/tool_utils.py index a14443bd..67306c9d 100644 --- a/vision_agent/tools/tool_utils.py +++ b/vision_agent/tools/tool_utils.py @@ -1,6 +1,6 @@ -import os import inspect import logging +import os from typing import Any, Callable, Dict, List, MutableMapping, Optional, Tuple import pandas as pd @@ -10,10 +10,10 @@ from requests.adapters import HTTPAdapter from urllib3.util.retry import Retry +from vision_agent.tools.tools_types import BoundingBoxes from vision_agent.utils.exceptions import RemoteToolCallFailed from vision_agent.utils.execute import Error, MimeType from vision_agent.utils.type_defs import LandingaiAPIKey -from vision_agent.tools.tools_types import BoundingBoxes _LOGGER = logging.getLogger(__name__) _LND_API_KEY = os.environ.get("LANDINGAI_API_KEY", LandingaiAPIKey().api_key) diff --git a/vision_agent/tools/tools_types.py b/vision_agent/tools/tools_types.py index f61c2cf1..6ebcf468 100644 --- a/vision_agent/tools/tools_types.py +++ b/vision_agent/tools/tools_types.py @@ -1,8 +1,8 @@ from enum import Enum +from typing import List, Optional, Tuple, Union from uuid import UUID -from typing import List, Tuple, Optional, Union -from pydantic import BaseModel, ConfigDict, Field, field_serializer, SerializationInfo +from pydantic import BaseModel, ConfigDict, Field, SerializationInfo, field_serializer class BboxInput(BaseModel):