diff --git a/vision_agent/agent/vision_agent.py b/vision_agent/agent/vision_agent.py index e6f5818d..514f8fa5 100644 --- a/vision_agent/agent/vision_agent.py +++ b/vision_agent/agent/vision_agent.py @@ -380,7 +380,6 @@ def sample_n_evenly_spaced(lst: Sequence, n: int) -> Sequence: return [lst[round(spacing * i)] for i in range(n)] - def visualize_result(all_tool_results: List[Dict]) -> Sequence[Union[str, Path]]: image_to_data: Dict[str, Dict] = {} for tool_result in all_tool_results: diff --git a/vision_agent/lmm/lmm.py b/vision_agent/lmm/lmm.py index a1fcc3c2..cc8861bd 100644 --- a/vision_agent/lmm/lmm.py +++ b/vision_agent/lmm/lmm.py @@ -9,10 +9,7 @@ import requests from openai import AzureOpenAI, OpenAI -from vision_agent.tools import ( - CHOOSE_PARAMS, - SYSTEM_PROMPT, -) +from vision_agent.tools import CHOOSE_PARAMS, SYSTEM_PROMPT _LOGGER = logging.getLogger(__name__) diff --git a/vision_agent/tools/__init__.py b/vision_agent/tools/__init__.py index 60870b56..10daf7eb 100644 --- a/vision_agent/tools/__init__.py +++ b/vision_agent/tools/__init__.py @@ -12,12 +12,12 @@ GroundingDINO, GroundingSAM, ImageCaption, - ZeroShotCounting, - VisualPromptCounting, - VisualQuestionAnswering, ImageQuestionAnswering, SegArea, SegIoU, Tool, + VisualPromptCounting, + VisualQuestionAnswering, + ZeroShotCounting, register_tool, ) diff --git a/vision_agent/tools/tools.py b/vision_agent/tools/tools.py index 3bf2bfbf..32a998db 100644 --- a/vision_agent/tools/tools.py +++ b/vision_agent/tools/tools.py @@ -17,9 +17,9 @@ normalize_bbox, rle_decode, ) +from vision_agent.lmm import OpenAILMM from vision_agent.tools.video import extract_frames_from_video from vision_agent.type_defs import LandingaiAPIKey -from vision_agent.lmm import OpenAILMM _LOGGER = logging.getLogger(__name__) _LND_API_KEY = LandingaiAPIKey().api_key