结果可视化
定义mark_vedio方法。基于提供的视频标记区域,将带时间戳的句级文本序列与视频帧匹配,并在视频中标记相应区域。使用了OpenCV库来处理视频帧,并在特定时间范围内绘制矩形和文本以标记指定区域。
def mark_video(input_video_path, output_video_path, matches):
cap = cv2.VideoCapture(input_video_path)
fps = cap.get(cv2.CAP_PROP_FPS)
frame_width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
frame_height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
fourcc = cv2.VideoWriter_fourcc(*'mp4v')
out = cv2.VideoWriter(output_video_path, fourcc, fps, (frame_width, frame_height))
frame_count = 0
current_region = None
current_kp_id = None
region_end_time = None
while cap.isOpened():
ret, frame = cap.read()
if not ret:
break
timestamp = int(frame_count / fps * 1000) # Convert frame count to milliseconds
for match in matches:
start_time, end_time, region, kp_id = match
if start_time <= timestamp <= end_time:
current_region = region
current_kp_id = kp_id
region_end_time = end_time
break
if current_region:
cv2.rectangle(frame, (current_region[0], current_region[1]), (current_region[2], current_region[3]), (0, 255, 0), 2)
cv2.putText(frame, current_kp_id, (current_region[0], current_region[1] - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 255, 0), 2)
out.write(frame)
frame_count += 1
cap.release()
out.release()
用上面定义的方法读取视频文件,对其进行处理并标记视频中的相关区域,然后将处理后的视频保存到输出文件夹中。即可完成可视化工作
for video in videos.unique():
video_file_path = f'{video_folder_path}{video}.avi' # 构建视频文件的完整路径
if not os.path.exists(video_file_path):
print(f"Video file not found: {video_file_path}")
continue
cap = cv2.VideoCapture('5_match.mp4')
# if not cap.isOpened():
# print(f"Failed to open video: {video_file_path}")
# continue
# 获取视频的帧率和分辨率
fps = cap.get(cv2.CAP_PROP_FPS)
width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
fourcc = cv2.VideoWriter_fourcc(*'mp4v')
out = cv2.VideoWriter(f'{output_video_path}{video}_processed.mp4', fourcc, fps, (width, height))
frame_count = 0
while cap.isOpened():
ret, frame = cap.read()
if not ret:
break
current_time = frame_count / fps
relevant_data = timestamps[(timestamps >= current_time) & (timestamps < current_time + 1 / fps)]
for i in relevant_data.index:
if videos[i] != video:
continue
x, y = positions.loc[i, [0, 1]]
# x = int(x + frame.shape[1] / 2) # Adjust x to center
# y = int(frame.shape[0] / 2 - y) # Adjust y to center
x = int(x)
y = int(-y)
# Draw the gaze point
cv2.circle(frame, (x, y), 10, (0, 0, 255), -1)
out.write(frame)
frame_count += 1
# 在视频末尾添加空白帧以确保输出视频长度与原视频一致
while frame_count < total_frames:
ret, frame = cap.read()
if not ret:
break
out.write(frame)
frame_count += 1
cap.release()
out.release()
print(f"Processed video saved: {video}_processed.mp4")
print("所有视频处理完成!")