diff --git a/vision_agent/lmm/types.py b/vision_agent/lmm/types.py index ba2b3189..b9c99fe2 100644 --- a/vision_agent/lmm/types.py +++ b/vision_agent/lmm/types.py @@ -1,5 +1,6 @@ from pathlib import Path from typing import Dict, Sequence, Union + from vision_agent.utils.execute import Execution TextOrImage = Union[str, Sequence[Union[str, Path]]] diff --git a/vision_agent/tools/__init__.py b/vision_agent/tools/__init__.py index cbd92358..e82d7553 100644 --- a/vision_agent/tools/__init__.py +++ b/vision_agent/tools/__init__.py @@ -21,8 +21,8 @@ dpt_hybrid_midas, extract_frames, florence2_image_caption, - florence2_phrase_grounding, florence2_ocr, + florence2_phrase_grounding, florence2_roberta_vqa, florence2_sam2_image, florence2_sam2_video,