diff --git a/vision_agent/agent/vision_agent.py b/vision_agent/agent/vision_agent.py index 29e9dee6..2c7febf5 100644 --- a/vision_agent/agent/vision_agent.py +++ b/vision_agent/agent/vision_agent.py @@ -14,13 +14,7 @@ VA_CODE, ) from vision_agent.lmm import LMM, AnthropicLMM, Message, OpenAILMM -from vision_agent.tools import ( - META_TOOL_DOCSTRING, - extract_frames, - load_image, - save_image, - save_video, -) +from vision_agent.tools import META_TOOL_DOCSTRING from vision_agent.tools.meta_tools import ( Artifacts, check_and_load_image, diff --git a/vision_agent/agent/vision_agent_coder.py b/vision_agent/agent/vision_agent_coder.py index 2efc7a50..2d29a8bf 100644 --- a/vision_agent/agent/vision_agent_coder.py +++ b/vision_agent/agent/vision_agent_coder.py @@ -2,12 +2,10 @@ import logging import os import sys -import tempfile from json import JSONDecodeError from pathlib import Path from typing import Any, Callable, Dict, List, Optional, Sequence, Tuple, Union, cast -from PIL import Image from rich.console import Console from rich.style import Style from rich.syntax import Syntax @@ -776,11 +774,11 @@ def chat_with_workflow( verbosity=self.verbosity, ) best_plan = plan_thoughts["best_plan"] - plan_thoughts = plan_thoughts["thoughts"] + plan_thoughts_str = plan_thoughts["thoughts"] else: best_plan = list(plans.keys())[0] tool_output_str = "" - plan_thoughts = "" + plan_thoughts_str = "" if best_plan in plans and best_plan in tool_infos: plan_i = plans[best_plan] @@ -815,7 +813,7 @@ def chat_with_workflow( + "\n-".join([e for e in plan_i["instructions"]]), tool_info=tool_info, tool_output=tool_output_str, - plan_thoughts=plan_thoughts, + plan_thoughts=plan_thoughts_str, tool_utils=T.UTILITIES_DOCSTRING, working_memory=working_memory, coder=self.coder,