From 8a8c5d1dacb159418ae4b72877624532a9ee20ee Mon Sep 17 00:00:00 2001 From: Dayanne Fernandes Date: Thu, 3 Oct 2024 22:49:10 -0300 Subject: [PATCH] fix video-temporal-localization --- vision_agent/tools/tools.py | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/vision_agent/tools/tools.py b/vision_agent/tools/tools.py index 35d8487f..6943a0ff 100644 --- a/vision_agent/tools/tools.py +++ b/vision_agent/tools/tools.py @@ -899,7 +899,10 @@ def ixc25_temporal_localization(prompt: str, frames: List[np.ndarray]) -> List[b "function_name": "ixc25_temporal_localization", } data: List[int] = send_inference_request( - payload, "video-temporal-localization", files=files, v2=True + payload, + "video-temporal-localization?model=internlm-xcomposer", + files=files, + v2=True, ) chunk_size = round(len(frames) / len(data)) data_explode = [[elt] * chunk_size for elt in data]