Skip to content

Commit 31a0ef7

Browse files
pufanyikcz358
authored and committed
if no response directly return 0 (#142)
1 parent 1f73767 commit 31a0ef7

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

lmms_eval/tasks/live_bench/utils.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -166,8 +166,8 @@ def livebench_process_results_for_name(doc, results, model, eval_name):
166166
if subtask not in SUBTASKS:
167167
subtask = "further insights"
168168
if not results or results[0] == "":
169-
return {eval_name: {"rating": 0, "explanation": "No response", "model_name": "N/A", "subtask": subtask}}
170-
rating, explanation, model_name = get_chat_response(gpt_model_name=model, base64_images=base64_images, question=doc["question"], ground_truth_answer=doc["answer"], answer=results[0] if results else "", criteria=criteria)
169+
return {"gpt4_eval_score": {"rating": 0, "explanation": "No response", "model_name": "N/A", "subtask": subtask}}
170+
rating, explanation, model_name = get_chat_response(base64_images=base64_images, question=doc["question"], ground_truth_answer=doc["answer"], answer=results[0] if results else "", criteria=criteria)
171171
if rating >= 0:
172172
return {eval_name: {"rating": rating, "explanation": explanation, "model_name": model_name, "subtask": subtask, "id": doc["id"]}}
173173
else:

0 commit comments

Comments
 (0)