Spaces:
Sleeping
Sleeping
import cv2 | |
import numpy as np | |
import torch | |
from ultralytics import YOLO | |
import gradio as gr | |
from scipy.interpolate import interp1d | |
import uuid | |
import os | |
try: | |
from OpenGL.GL import * | |
from OpenGL.GLU import * | |
from pygame import display, event, QUIT | |
HAS_OPENGL = True | |
except ImportError: | |
print("Warning: PyOpenGL or Pygame not found. 3D visualization will be disabled. Install with 'pip install PyOpenGL PyOpenGL_accelerate pygame'.") | |
HAS_OPENGL = False | |
# Load the trained YOLOv8n model | |
model = YOLO("best.pt") | |
# Constants | |
STUMPS_WIDTH = 0.2286 # meters | |
FRAME_RATE = 20 | |
SLOW_MOTION_FACTOR = 2 | |
CONF_THRESHOLD = 0.3 | |
PITCH_ZONE_Y = 0.8 | |
IMPACT_ZONE_Y = 0.7 | |
IMPACT_DELTA_Y = 20 | |
STUMPS_HEIGHT = 0.711 # meters | |
PITCH_LENGTH = 20.12 # meters (22 yards) | |
def process_video(video_path): | |
if not os.path.exists(video_path): | |
return [], [], [], "Error: Video file not found" | |
cap = cv2.VideoCapture(video_path) | |
frames = [] | |
ball_positions = [] | |
detection_frames = [] | |
debug_log = [] | |
frame_count = 0 | |
while cap.isOpened(): | |
ret, frame = cap.read() | |
if not ret: | |
break | |
frames.append(frame.copy()) | |
frame = cv2.convertScaleAbs(frame, alpha=1.2, beta=10) | |
results = model.predict(frame, conf=CONF_THRESHOLD) | |
detections = [det for det in results[0].boxes if det.cls == 0] | |
if len(detections) == 1: | |
x1, y1, x2, y2 = detections[0].xyxy[0].cpu().numpy() | |
ball_positions.append([(x1 + x2) / 2, (y1 + y2) / 2]) | |
detection_frames.append(len(frames) - 1) | |
cv2.rectangle(frame, (int(x1), int(y1)), (int(x2), int(y2)), (0, 255, 0), 2) | |
frames[-1] = frame | |
debug_log.append(f"Frame {frame_count}: {len(detections)} ball detections") | |
frame_count += 1 | |
cap.release() | |
if not ball_positions: | |
debug_log.append("No valid single-ball detections in any frame") | |
else: | |
debug_log.append(f"Total valid single-ball detections: {len(ball_positions)}") | |
return frames, ball_positions, detection_frames, "\n".join(debug_log) | |
def estimate_trajectory_3d(ball_positions, detection_frames, frames): | |
if len(ball_positions) < 2: | |
return None, None, None, None, None, None, "Error: Fewer than 2 valid single-ball detections" | |
frame_height, frame_width = frames[0].shape[:2] | |
x_coords = np.array([pos[0] for pos in ball_positions]) / frame_width * PITCH_LENGTH | |
y_coords = np.array([frame_height - pos[1] for pos in ball_positions]) / frame_height * STUMPS_HEIGHT * 2 | |
z_coords = np.zeros_like(x_coords) # Placeholder for depth | |
times = np.array([i / FRAME_RATE for i in range(len(ball_positions))]) | |
pitch_idx = 0 | |
for i, y in enumerate(y_coords): | |
if y < STUMPS_HEIGHT: | |
pitch_idx = i | |
break | |
pitch_point = (x_coords[pitch_idx], y_coords[pitch_idx], 0) | |
pitch_frame = detection_frames[pitch_idx] | |
impact_idx = None | |
for i in range(1, len(y_coords)): | |
if (y_coords[i] > STUMPS_HEIGHT and | |
abs(y_coords[i] - y_coords[i-1]) > IMPACT_DELTA_Y * STUMPS_HEIGHT / frame_height): | |
impact_idx = i | |
break | |
if impact_idx is None: | |
impact_idx = len(y_coords) - 1 | |
impact_point = (x_coords[impact_idx], y_coords[impact_idx], 0) | |
impact_frame = detection_frames[impact_idx] | |
# Use cubic interpolation to avoid derivative mismatch | |
try: | |
fx = interp1d(times[:impact_idx + 1], x_coords[:impact_idx + 1], kind='cubic', fill_value="extrapolate") | |
fy = interp1d(times[:impact_idx + 1], y_coords[:impact_idx + 1], kind='cubic', fill_value="extrapolate") | |
fz = interp1d(times[:impact_idx + 1], z_coords[:impact_idx + 1], kind='cubic', fill_value="extrapolate") | |
except ValueError as e: | |
# Fallback to linear if cubic fails (e.g., too few points) | |
fx = interp1d(times[:impact_idx + 1], x_coords[:impact_idx + 1], kind='linear', fill_value="extrapolate") | |
fy = interp1d(times[:impact_idx + 1], y_coords[:impact_idx + 1], kind='linear', fill_value="extrapolate") | |
fz = interp1d(times[:impact_idx + 1], z_coords[:impact_idx + 1], kind='linear', fill_value="extrapolate") | |
print(f"Warning: Cubic interpolation failed, falling back to linear. Error: {str(e)}") | |
t_full = np.linspace(times[0], times[impact_idx] + 0.5, 50) | |
full_trajectory = list(zip(fx(t_full), fy(t_full), fz(t_full))) | |
vis_trajectory = list(zip(x_coords, y_coords, z_coords))[:impact_idx + 1] | |
return full_trajectory, vis_trajectory, pitch_point, pitch_frame, impact_point, impact_frame, "Trajectory estimated" | |
def lbw_decision(ball_positions, full_trajectory, frames, pitch_point, impact_point): | |
if not frames or not full_trajectory: | |
return "Error: No data", None, None, None | |
frame_height, frame_width = frames[0].shape[:2] | |
stumps_x = PITCH_LENGTH / 2 | |
stumps_y = 0 | |
stumps_width = STUMPS_WIDTH | |
pitch_x, pitch_y, _ = pitch_point | |
impact_x, impact_y, _ = impact_point | |
in_line_threshold = stumps_width / 2 | |
if abs(pitch_x - stumps_x) > in_line_threshold: | |
return f"Not Out (Pitched outside line at x: {pitch_x:.1f})", full_trajectory, pitch_point, impact_point | |
if abs(impact_x - stumps_x) > in_line_threshold or impact_y < stumps_y: | |
return f"Not Out (Impact outside line at x: {impact_x:.1f})", full_trajectory, pitch_point, impact_point | |
hit_stumps = False | |
for x, y, z in full_trajectory: | |
if (abs(x - stumps_x) < in_line_threshold and | |
abs(y - stumps_y) < STUMPS_HEIGHT / 2): | |
hit_stumps = True | |
break | |
if hit_stumps: | |
if abs(x - stumps_x) < in_line_threshold * 0.1: | |
return f"Umpire's Call - Not Out", full_trajectory, pitch_point, impact_point | |
return f"Out (Ball hits stumps)", full_trajectory, pitch_point, impact_point | |
return f"Not Out (Missing stumps)", full_trajectory, pitch_point, impact_point | |
def generate_slow_motion(frames, vis_trajectory, pitch_point, pitch_frame, impact_point, impact_frame, detection_frames, output_path, decision, frame_width, frame_height): | |
if not frames: | |
return None | |
fourcc = cv2.VideoWriter_fourcc(*'mp4v') | |
out = cv2.VideoWriter(output_path, fourcc, FRAME_RATE / SLOW_MOTION_FACTOR, (frame_width, frame_height)) | |
trajectory_points = np.array([[p[0] * frame_width / PITCH_LENGTH, frame_height - (p[1] * frame_height / (STUMPS_HEIGHT * 2))] for p in vis_trajectory], dtype=np.int32).reshape((-1, 1, 2)) | |
for i, frame in enumerate(frames): | |
# Draw stumps outline (scaled back to pixel coordinates) | |
stumps_x = frame_width / 2 | |
stumps_y = frame_height * 0.8 | |
stumps_width_pixels = frame_width * (STUMPS_WIDTH / PITCH_LENGTH) | |
stumps_height_pixels = frame_height * (STUMPS_HEIGHT / (STUMPS_HEIGHT * 2)) | |
cv2.line(frame, (int(stumps_x - stumps_width_pixels / 2), int(stumps_y)), | |
(int(stumps_x + stumps_width_pixels / 2), int(stumps_y)), (255, 255, 255), 2) | |
cv2.line(frame, (int(stumps_x - stumps_width_pixels / 2), int(stumps_y - stumps_height_pixels)), | |
(int(stumps_x - stumps_width_pixels / 2), int(stumps_y)), (255, 255, 255), 2) | |
cv2.line(frame, (int(stumps_x + stumps_width_pixels / 2), int(stumps_y - stumps_height_pixels)), | |
(int(stumps_x + stumps_width_pixels / 2), int(stumps_y)), (255, 255, 255), 2) | |
# Draw crease line | |
cv2.line(frame, (int(stumps_x - stumps_width_pixels / 2), int(stumps_y)), | |
(int(stumps_x + stumps_width_pixels / 2), int(stumps_y)), (255, 255, 0), 2) | |
if i in detection_frames and trajectory_points.size > 0: | |
idx = detection_frames.index(i) + 1 | |
if idx <= len(trajectory_points): | |
cv2.polylines(frame, [trajectory_points[:idx]], False, (0, 0, 255), 2) # Blue trajectory | |
if pitch_point and i == pitch_frame: | |
x = pitch_point[0] * frame_width / PITCH_LENGTH | |
y = frame_height - (pitch_point[1] * frame_height / (STUMPS_HEIGHT * 2)) | |
cv2.circle(frame, (int(x), int(y)), 8, (0, 255, 0), -1) # Green for pitching | |
cv2.putText(frame, "Pitching", (int(x) + 10, int(y) - 10), | |
cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 255, 0), 1) | |
if impact_point and i == impact_frame: | |
x = impact_point[0] * frame_width / PITCH_LENGTH | |
y = frame_height - (impact_point[1] * frame_height / (STUMPS_HEIGHT * 2)) | |
cv2.circle(frame, (int(x), int(y)), 8, (0, 0, 255), -1) # Red for impact | |
cv2.putText(frame, "Impact", (int(x) + 10, int(y) + 20), | |
cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 255), 1) | |
if impact_point and i == impact_frame and "Out" in decision: | |
cv2.putText(frame, "Wickets", (int(stumps_x) - 50, int(stumps_y) - 20), | |
cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 165, 255), 1) # Orange for wickets | |
for _ in range(SLOW_MOTION_FACTOR): | |
out.write(frame) | |
out.release() | |
return output_path | |
def draw_3d_scene(trajectory, pitch_point, impact_point, decision): | |
if not HAS_OPENGL: | |
return | |
glClear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT) | |
glBegin(GL_LINES) | |
for i in range(len(trajectory) - 1): | |
glColor3f(0, 0, 1) # Blue trajectory | |
glVertex3f(trajectory[i][0], trajectory[i][1], trajectory[i][2]) | |
glVertex3f(trajectory[i + 1][0], trajectory[i + 1][1], trajectory[i + 1][2]) | |
glEnd() | |
glColor3f(0, 1, 0) # Green pitch | |
glBegin(GL_QUADS) | |
glVertex3f(0, 0, 0) | |
glVertex3f(PITCH_LENGTH, 0, 0) | |
glVertex3f(PITCH_LENGTH, 0, -1) | |
glVertex3f(0, 0, -1) | |
glEnd() | |
glColor3f(1, 1, 1) # White stumps | |
glBegin(GL_LINES) | |
glVertex3f(PITCH_LENGTH / 2 - STUMPS_WIDTH / 2, 0, 0) | |
glVertex3f(PITCH_LENGTH / 2 - STUMPS_WIDTH / 2, STUMPS_HEIGHT, 0) | |
glVertex3f(PITCH_LENGTH / 2 + STUMPS_WIDTH / 2, 0, 0) | |
glVertex3f(PITCH_LENGTH / 2 + STUMPS_WIDTH / 2, STUMPS_HEIGHT, 0) | |
glEnd() | |
if pitch_point: | |
glColor3f(0, 1, 0) # Green | |
glPushMatrix() | |
glTranslatef(pitch_point[0], pitch_point[1], pitch_point[2]) | |
glutSolidSphere(0.1, 20, 20) | |
glPopMatrix() | |
if impact_point: | |
glColor3f(1, 0, 0) # Red | |
glPushMatrix() | |
glTranslatef(impact_point[0], impact_point[1], impact_point[2]) | |
glutSolidSphere(0.1, 20, 20) | |
glPopMatrix() | |
if "Out" in decision: | |
glColor3f(1, 0.65, 0) # Orange | |
glRasterPos3f(PITCH_LENGTH / 2, STUMPS_HEIGHT, 0) | |
for char in "Wickets": | |
glutBitmapCharacter(GLUT_BITMAP_HELVETICA_12, ord(char)) | |
display.flip() | |
def init_3d_window(width, height): | |
if not HAS_OPENGL: | |
return | |
pygame.init() | |
display.set_mode((width, height), DOUBLEBUF | OPENGL) | |
gluPerspective(45, (width / height), 0.1, 50.0) | |
glTranslatef(0.0, -5.0, -30) | |
glEnable(GL_DEPTH_TEST) | |
def drs_review(video): | |
frames, ball_positions, detection_frames, debug_log = process_video(video) | |
if not frames: | |
return f"Error: Failed to process video\nDebug Log:\n{debug_log}", None | |
full_trajectory, vis_trajectory, pitch_point, pitch_frame, impact_point, impact_frame, trajectory_log = estimate_trajectory_3d(ball_positions, detection_frames, frames) | |
decision, full_trajectory, pitch_point, impact_point = lbw_decision(ball_positions, full_trajectory, frames, pitch_point, impact_point) | |
frame_height, frame_width = frames[0].shape[:2] | |
output_path = f"output_{uuid.uuid4()}.mp4" | |
slow_motion_path = generate_slow_motion(frames, vis_trajectory, pitch_point, pitch_frame, impact_point, impact_frame, detection_frames, output_path, decision, frame_width, frame_height) | |
if HAS_OPENGL: | |
init_3d_window(800, 600) | |
from OpenGL.GLUT import glutInit, glutSolidSphere | |
glutInit() | |
for _ in range(100): # Limited frames for demo | |
draw_3d_scene(full_trajectory, pitch_point, impact_point, decision) | |
event.pump() | |
debug_output = f"{debug_log}\n{trajectory_log}" | |
return f"DRS Decision: {decision}\nDebug Log:\n{debug_output}", slow_motion_path | |
# Gradio interface | |
iface = gr.Interface( | |
fn=drs_review, | |
inputs=gr.Video(label="Upload Video Clip"), | |
outputs=[ | |
gr.Textbox(label="DRS Decision and Debug Log"), | |
gr.Video(label="Slow-Motion Replay with 2D Annotations") | |
], | |
title="AI-Powered 3D DRS for LBW", | |
description="Upload a video clip for 3D DRS analysis with pitching (green), impact (red), and wickets (orange) visualization, and 2D annotated video output." | |
) | |
if __name__ == "__main__": | |
iface.launch() |