VideoSimpleQA / utils /count_frames.py
hzy's picture
Initial upload of all project files
608eb1a verified
import json
with open(
"/mnt/bn/ziyang-storage-cloudnative-hl/VideoSimpleQA/o4-mini-2025-04-16_lvbench_agent_results.json",
"r",
) as f:
data = json.load(f)
# print(data[0])
# import pdb; pdb.set_trace()
# print(data[1])
frames_count = []
# for d in data:
# num_frames = 0
# for turn in d["agent_conversation"]:
# if turn["role"] == "assistant" and turn["tool_calls"]:
# for tool_call in turn["tool_calls"]:
# frame_ids = json.loads(tool_call["function"]["arguments"])["frame_ids"]
# num_frames += len(frame_ids)
# frames_count.append(num_frames)
for d in data:
num_frames = 0
for turn in d["agent_conversation"]:
if turn["role"] == "user" and type(turn['content']) == list:
for item in turn['content']:
if item['type'] == 'image_url':
num_frames += 1
frames_count.append(num_frames)
print(f"mean frames: {sum(frames_count) / len(frames_count)}")
print(f"max frames: {max(frames_count)}")
print(f"min frames: {min(frames_count)}")