import os
import json
import base64
from io import BytesIO
from typing import List, Dict, Any, Optional
from collections import deque, defaultdict
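
# Roboflow's `inference` package loads optional "core models" controlled by
# CORE_MODEL_*_ENABLED environment variables; they must be set before
# `from inference import get_model` below so the unused models are never
# initialized.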
os.environ["CORE_MODEL_SAM_ENABLED"] = "False"
os.environ["CORE_MODEL_SAM2_ENABLED"] = "False"
os.environ["CORE_MODEL_SAM3_ENABLED"] = "False"
os.environ["CORE_MODEL_GAZE_ENABLED"] = "False"
os.environ["CORE_MODEL_GROUNDINGDINO_ENABLED"] = "False"
os.environ["CORE_MODEL_YOLO_WORLD_ENABLED"] = "False"

import numpy as np
import cv2
import torch
from more_itertools import chunked
from PIL import Image
from tqdm import tqdm

import supervision as sv
from inference import get_model
from transformers import AutoProcessor, SiglipVisionModel
import umap
from sklearn.cluster import KMeans
import plotly.graph_objects as go

from sports.common.team import TeamClassifier
from sports.common.view import ViewTransformer
from sports.configs.soccer import SoccerPitchConfiguration
from sports.annotators.soccer import (
    draw_pitch,
    draw_points_on_pitch,
    draw_pitch_voronoi_diagram,
    draw_paths_on_pitch,
)


PLAYER_DETECTION_MODEL = None
FIELD_DETECTION_MODEL = None
EMBEDDINGS_MODEL = None
EMBEDDINGS_PROCESSOR = None
TEAM_CLASSIFIER = None
PITCH_CONFIG = None

BALL_ID = 0
GOALKEEPER_ID = 1
PLAYER_ID = 2
REFEREE_ID = 3

MODELS_READY = False

CURRENT_JOB_DIR: Optional[str] = None


def set_job_dir(job_dir: str):
    global CURRENT_JOB_DIR
    CURRENT_JOB_DIR = job_dir


def update_progress(stage: str, progress: float, message: str = ""):
    """
    Write a small JSON status file in the current job dir so the UI can poll.
    """
    if not CURRENT_JOB_DIR:
        return
    status = {
        "stage": stage,
        "progress": float(progress),
        "message": message,
    }
    os.makedirs(CURRENT_JOB_DIR, exist_ok=True)
    status_path = os.path.join(CURRENT_JOB_DIR, "status.json")
    with open(status_path, "w", encoding="utf-8") as f:
        json.dump(status, f)
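
# The UI polls <job_dir>/status.json; a typical payload written above looks
# like: {"stage": "ball_path", "progress": 0.6, "message": "Computing ball path..."}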


def get_device() -> str:
    return "cuda" if torch.cuda.is_available() else "cpu"


def ensure_models_loaded():
    """
    Lazily load all heavy models and config.
    Called at the start of run_full_pipeline().
    """
    global PLAYER_DETECTION_MODEL, FIELD_DETECTION_MODEL
    global EMBEDDINGS_MODEL, EMBEDDINGS_PROCESSOR
    global TEAM_CLASSIFIER, PITCH_CONFIG, MODELS_READY

    if MODELS_READY:
        return

    roboflow_api_key = os.environ.get("ROBOFLOW_API_KEY")
    if not roboflow_api_key:
        raise RuntimeError(
            "ROBOFLOW_API_KEY env var must be set in the Space secrets "
            "(Settings → Variables and secrets)."
        )

    PLAYER_DETECTION_MODEL_ID = "football-players-detection-3zvbc/11"
    FIELD_DETECTION_MODEL_ID = "football-field-detection-f07vi/14"

    PLAYER_DETECTION_MODEL = get_model(
        model_id=PLAYER_DETECTION_MODEL_ID, api_key=roboflow_api_key
    )
    FIELD_DETECTION_MODEL = get_model(
        model_id=FIELD_DETECTION_MODEL_ID, api_key=roboflow_api_key
    )

    SIGLIP_MODEL_PATH = "google/siglip-base-patch16-224"
    device = get_device()
    EMBEDDINGS_MODEL = SiglipVisionModel.from_pretrained(SIGLIP_MODEL_PATH).to(device)
    EMBEDDINGS_PROCESSOR = AutoProcessor.from_pretrained(SIGLIP_MODEL_PATH)

    PITCH_CONFIG = SoccerPitchConfiguration()
    TEAM_CLASSIFIER = TeamClassifier(device=device)

    MODELS_READY = True
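
# The two Roboflow model ids above are the public Universe models used in the
# upstream Roboflow sports notebooks; point them at your own fine-tuned
# versions if needed.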


def save_image(path: str, img: np.ndarray) -> None:
    # Frames from supervision's generator and the sports annotators are
    # already in OpenCV BGR order, which is what cv2.imwrite expects, so no
    # channel conversion is needed here.
    os.makedirs(os.path.dirname(path), exist_ok=True)
    cv2.imwrite(path, img)
def step_basic_frames(video_path: str, out_dir: str) -> Dict[str, str]:
    ensure_models_loaded()

    frame_generator = sv.get_video_frames_generator(video_path)
    frame = next(frame_generator)

    raw_path = os.path.join(out_dir, "frame_raw.png")
    save_image(raw_path, frame)

    box_annotator = sv.BoxAnnotator(
        color=sv.ColorPalette.from_hex(["#FF8C00", "#00BFFF", "#FF1493", "#FFD700"]),
        thickness=2,
    )
    label_annotator = sv.LabelAnnotator(
        color=sv.ColorPalette.from_hex(["#FF8C00", "#00BFFF", "#FF1493", "#FFD700"]),
        text_color=sv.Color.from_hex("#000000"),
    )

    result = PLAYER_DETECTION_MODEL.infer(frame, confidence=0.3)[0]
    detections = sv.Detections.from_inference(result)

    labels = [
        f"{class_name} {confidence:.2f}"
        for class_name, confidence in zip(detections["class_name"], detections.confidence)
    ]

    annotated = frame.copy()
    annotated = box_annotator.annotate(scene=annotated, detections=detections)
    annotated = label_annotator.annotate(scene=annotated, detections=detections, labels=labels)

    boxes_path = os.path.join(out_dir, "frame_boxes_labels.png")
    save_image(boxes_path, annotated)

    ellipse_annotator = sv.EllipseAnnotator(
        color=sv.ColorPalette.from_hex(["#00BFFF", "#FF1493", "#FFD700"]),
        thickness=2,
    )
    triangle_annotator = sv.TriangleAnnotator(
        color=sv.Color.from_hex("#FFD700"),
        base=25,
        height=21,
        outline_thickness=1,
    )

    # Reuse the detections from above rather than running inference a second
    # time on the same frame.
    ball_detections = detections[detections.class_id == BALL_ID]
    ball_detections.xyxy = sv.pad_boxes(xyxy=ball_detections.xyxy, px=10)

    all_detections = detections[detections.class_id != BALL_ID]
    all_detections = all_detections.with_nms(threshold=0.5, class_agnostic=True)
    all_detections.class_id -= 1

    annotated2 = frame.copy()
    annotated2 = ellipse_annotator.annotate(scene=annotated2, detections=all_detections)
    annotated2 = triangle_annotator.annotate(scene=annotated2, detections=ball_detections)

    ball_players_path = os.path.join(out_dir, "frame_ball_players.png")
    save_image(ball_players_path, annotated2)

    return {
        "raw_frame": raw_path,
        "boxes_labels": boxes_path,
        "ball_players": ball_players_path,
    }
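
# Note: `all_detections.class_id -= 1` above shifts goalkeeper/player/referee
# ids (1, 2, 3) down to (0, 1, 2) so that, with the ball class removed, they
# index the three-color ellipse palette directly.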


def step_siglip_clustering(video_path: str, out_dir: str) -> Dict[str, str]:
    ensure_models_loaded()

    stride = 30
    frame_generator = sv.get_video_frames_generator(source_path=video_path, stride=stride)

    crops = []
    for frame in tqdm(frame_generator, desc="collecting crops (SigLIP)"):
        result = PLAYER_DETECTION_MODEL.infer(frame, confidence=0.3)[0]
        detections = sv.Detections.from_inference(result)
        detections = detections.with_nms(threshold=0.5, class_agnostic=True)
        detections = detections[detections.class_id == PLAYER_ID]
        players_crops = [sv.crop_image(frame, xyxy) for xyxy in detections.xyxy]
        crops += players_crops

    if not crops:
        return {"plot_html": ""}

    crops_pil = [sv.cv2_to_pillow(c) for c in crops]

    BATCH_SIZE = 32
    batches = chunked(crops_pil, BATCH_SIZE)
    data = []
    device = get_device()
    with torch.no_grad():
        for batch in tqdm(batches, desc="embedding extraction"):
            inputs = EMBEDDINGS_PROCESSOR(images=batch, return_tensors="pt").to(device)
            outputs = EMBEDDINGS_MODEL(**inputs)
            embeddings = torch.mean(outputs.last_hidden_state, dim=1).cpu().numpy()
            data.append(embeddings)

    data = np.concatenate(data)

    REDUCER = umap.UMAP(n_components=3)
    CLUSTERING_MODEL = KMeans(n_clusters=2, n_init="auto")

    projections = REDUCER.fit_transform(data)
    clusters = CLUSTERING_MODEL.fit_predict(projections)

    def pil_image_to_data_uri(image: Image.Image) -> str:
        buffered = BytesIO()
        image.save(buffered, format="PNG")
        img_str = base64.b64encode(buffered.getvalue()).decode("utf-8")
        return f"data:image/png;base64,{img_str}"

    image_data_uris = {f"image_{i}": pil_image_to_data_uri(img) for i, img in enumerate(crops_pil)}
    image_ids = np.array([f"image_{i}" for i in range(len(crops_pil))])

    traces = []
    unique_labels = np.unique(clusters)
    for lbl in unique_labels:
        mask = clusters == lbl
        customdata_masked = image_ids[mask]
        trace = go.Scatter3d(
            x=projections[mask][:, 0],
            y=projections[mask][:, 1],
            z=projections[mask][:, 2],
            mode="markers+text",
            text=clusters[mask],
            customdata=customdata_masked,
            name=str(lbl),
            marker=dict(size=8),
            hovertemplate="<b>class: %{text}</b><br>image ID: %{customdata}<extra></extra>",
        )
        traces.append(trace)

    min_val = np.min(projections)
    max_val = np.max(projections)
    padding = (max_val - min_val) * 0.05
    axis_range = [min_val - padding, max_val + padding]

    fig = go.Figure(data=traces)
    fig.update_layout(
        scene=dict(
            xaxis=dict(title="X", range=axis_range),
            yaxis=dict(title="Y", range=axis_range),
            zaxis=dict(title="Z", range=axis_range),
            aspectmode="cube",
        ),
        width=1000,
        height=1000,
        showlegend=False,
    )

    plotly_div = fig.to_html(full_html=False, include_plotlyjs=False, div_id="scatter-plot-3d")

    # json.dumps (rather than the Python dict repr) guarantees a valid JS
    # object literal for the data-URI lookup table.
    javascript_code = f"""
    <script>
        function displayImage(imageId) {{
            var imageElement = document.getElementById('image-display');
            var placeholderText = document.getElementById('placeholder-text');
            var imageDataURIs = {json.dumps(image_data_uris)};
            imageElement.src = imageDataURIs[imageId];
            imageElement.style.display = 'block';
            placeholderText.style.display = 'none';
        }}
        var chartElement = document.getElementById('scatter-plot-3d');
        chartElement.on('plotly_click', function(data) {{
            var customdata = data.points[0].customdata;
            displayImage(customdata);
        }});
    </script>
    """

    html_template = f"""
    <!DOCTYPE html>
    <html>
    <head>
        <script src="https://cdn.plot.ly/plotly-latest.min.js"></script>
        <style>
            #image-container {{
                position: fixed;
                top: 0;
                left: 0;
                width: 200px;
                height: 200px;
                padding: 5px;
                border: 1px solid #ccc;
                background-color: white;
                z-index: 1000;
                box-sizing: border-box;
                display: flex;
                align-items: center;
                justify-content: center;
                text-align: center;
            }}
            #image-display {{
                width: 100%;
                height: 100%;
                object-fit: contain;
            }}
        </style>
    </head>
    <body>
        {plotly_div}
        <div id="image-container">
            <img id="image-display" src="" alt="Selected image" style="display: none;" />
            <p id="placeholder-text">Click on a data entry to display an image</p>
        </div>
        {javascript_code}
    </body>
    </html>
    """

    os.makedirs(out_dir, exist_ok=True)
    html_path = os.path.join(out_dir, "siglip_clusters.html")
    with open(html_path, "w", encoding="utf-8") as f:
        f.write(html_template)

    return {"plot_html": html_path}
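
# The HTML artifact is self-contained apart from the plotly.js CDN script:
# every player crop is inlined as a base64 data URI, so clicking a 3-D point
# shows the matching crop without any server round-trip.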


def train_team_classifier_on_video(video_path: str, stride: int = 30) -> None:
    ensure_models_loaded()

    frame_generator = sv.get_video_frames_generator(source_path=video_path, stride=stride)
    crops = []
    for frame in tqdm(frame_generator, desc="collecting crops (TeamClassifier)"):
        result = PLAYER_DETECTION_MODEL.infer(frame, confidence=0.3)[0]
        detections = sv.Detections.from_inference(result)
        players_detections = detections[detections.class_id == PLAYER_ID]
        players_crops = [sv.crop_image(frame, xyxy) for xyxy in players_detections.xyxy]
        crops += players_crops

    if crops:
        TEAM_CLASSIFIER.fit(crops)
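
# TeamClassifier.fit() learns the two team appearance clusters from these
# crops; it must run before any step that calls TEAM_CLASSIFIER.predict()
# (the advanced single-frame view and the full-video analysis below).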


def resolve_goalkeepers_team_id(players: sv.Detections, goalkeepers: sv.Detections) -> np.ndarray:
    """Assign each goalkeeper to the team whose player centroid is closest."""
    if len(goalkeepers) == 0 or len(players) == 0:
        return np.array([])
    goalkeepers_xy = goalkeepers.get_anchors_coordinates(sv.Position.BOTTOM_CENTER)
    players_xy = players.get_anchors_coordinates(sv.Position.BOTTOM_CENTER)
    team_0_centroid = players_xy[players.class_id == 0].mean(axis=0)
    team_1_centroid = players_xy[players.class_id == 1].mean(axis=0)
    goalkeepers_team_id = []
    for goalkeeper_xy in goalkeepers_xy:
        dist_0 = np.linalg.norm(goalkeeper_xy - team_0_centroid)
        dist_1 = np.linalg.norm(goalkeeper_xy - team_1_centroid)
        goalkeepers_team_id.append(0 if dist_0 < dist_1 else 1)
    return np.array(goalkeepers_team_id)


def draw_pitch_voronoi_diagram_2(
    config: SoccerPitchConfiguration,
    team_1_xy: np.ndarray,
    team_2_xy: np.ndarray,
    team_1_color: sv.Color = sv.Color.RED,
    team_2_color: sv.Color = sv.Color.WHITE,
    opacity: float = 0.5,
    padding: int = 50,
    scale: float = 0.1,
    pitch: Optional[np.ndarray] = None,
) -> np.ndarray:
    if pitch is None:
        pitch = draw_pitch(config=config, padding=padding, scale=scale)

    scaled_width = int(config.width * scale)
    scaled_length = int(config.length * scale)

    voronoi = np.zeros_like(pitch, dtype=np.uint8)

    team_1_color_bgr = np.array(team_1_color.as_bgr(), dtype=np.uint8)
    team_2_color_bgr = np.array(team_2_color.as_bgr(), dtype=np.uint8)

    y_coordinates, x_coordinates = np.indices((scaled_width + 2 * padding, scaled_length + 2 * padding))
    y_coordinates -= padding
    x_coordinates -= padding

    def calculate_distances(xy, x_coordinates, y_coordinates):
        return np.sqrt(
            (xy[:, 0][:, None, None] * scale - x_coordinates) ** 2
            + (xy[:, 1][:, None, None] * scale - y_coordinates) ** 2
        )

    distances_team_1 = calculate_distances(team_1_xy, x_coordinates, y_coordinates)
    distances_team_2 = calculate_distances(team_2_xy, x_coordinates, y_coordinates)

    min_distances_team_1 = np.min(distances_team_1, axis=0)
    min_distances_team_2 = np.min(distances_team_2, axis=0)

    steepness = 15
    distance_ratio = min_distances_team_2 / np.clip(
        min_distances_team_1 + min_distances_team_2, a_min=1e-5, a_max=None
    )
    blend_factor = np.tanh((distance_ratio - 0.5) * steepness) * 0.5 + 0.5

    for c in range(3):
        voronoi[:, :, c] = (
            blend_factor * team_1_color_bgr[c] + (1 - blend_factor) * team_2_color_bgr[c]
        ).astype(np.uint8)

    overlay = cv2.addWeighted(voronoi, opacity, pitch, 1 - opacity, 0)
    return overlay
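
# The tanh blend above is what distinguishes draw_pitch_voronoi_diagram_2 from
# the hard-edged library version: a pixel equidistant from both teams
# (distance_ratio = 0.5) blends the colors 50/50, and steepness = 15 keeps the
# transition band narrow so the result still reads as a Voronoi diagram.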


def step_single_frame_advanced(video_path: str, out_dir: str) -> Dict[str, str]:
    ensure_models_loaded()

    frame_generator = sv.get_video_frames_generator(video_path)
    frame = next(frame_generator)

    ellipse_annotator = sv.EllipseAnnotator(
        color=sv.ColorPalette.from_hex(["#00BFFF", "#FF1493", "#FFD700"]),
        thickness=2,
    )
    label_annotator = sv.LabelAnnotator(
        color=sv.ColorPalette.from_hex(["#00BFFF", "#FF1493", "#FFD700"]),
        text_color=sv.Color.from_hex("#000000"),
        text_position=sv.Position.BOTTOM_CENTER,
    )
    triangle_annotator = sv.TriangleAnnotator(
        color=sv.Color.from_hex("#FFD700"), base=25, height=21, outline_thickness=1
    )

    tracker = sv.ByteTrack()
    tracker.reset()

    result = PLAYER_DETECTION_MODEL.infer(frame, confidence=0.3)[0]
    detections = sv.Detections.from_inference(result)

    ball_detections = detections[detections.class_id == BALL_ID]
    ball_detections.xyxy = sv.pad_boxes(xyxy=ball_detections.xyxy, px=10)

    all_detections = detections[detections.class_id != BALL_ID]
    all_detections = all_detections.with_nms(threshold=0.5, class_agnostic=True)
    all_detections = tracker.update_with_detections(detections=all_detections)

    goalkeepers_detections = all_detections[all_detections.class_id == GOALKEEPER_ID]
    players_detections = all_detections[all_detections.class_id == PLAYER_ID]
    referees_detections = all_detections[all_detections.class_id == REFEREE_ID]

    players_crops = [sv.crop_image(frame, xyxy) for xyxy in players_detections.xyxy]
    if players_crops:
        players_detections.class_id = TEAM_CLASSIFIER.predict(players_crops)

    if len(goalkeepers_detections) > 0 and len(players_detections) > 0:
        goalkeepers_detections.class_id = resolve_goalkeepers_team_id(
            players_detections, goalkeepers_detections
        )

    referees_detections.class_id -= 1

    all_detections2 = sv.Detections.merge(
        [players_detections, goalkeepers_detections, referees_detections]
    )

    labels = [f"#{tid}" for tid in all_detections2.tracker_id]
    all_detections2.class_id = all_detections2.class_id.astype(int)

    annotated_frame = frame.copy()
    annotated_frame = ellipse_annotator.annotate(scene=annotated_frame, detections=all_detections2)
    annotated_frame = label_annotator.annotate(
        scene=annotated_frame, detections=all_detections2, labels=labels
    )
    annotated_frame = triangle_annotator.annotate(
        scene=annotated_frame, detections=ball_detections
    )

    os.makedirs(out_dir, exist_ok=True)
    annotated_path = os.path.join(out_dir, "frame_advanced.png")
    save_image(annotated_path, annotated_frame)

    result = FIELD_DETECTION_MODEL.infer(frame, confidence=0.3)[0]
    key_points = sv.KeyPoints.from_inference(result)

    filt = key_points.confidence[0] > 0.5
    frame_reference_points = key_points.xy[0][filt]
    pitch_reference_points = np.array(PITCH_CONFIG.vertices)[filt]

    transformer = ViewTransformer(source=frame_reference_points, target=pitch_reference_points)

    frame_ball_xy = ball_detections.get_anchors_coordinates(sv.Position.BOTTOM_CENTER)
    pitch_ball_xy = transformer.transform_points(points=frame_ball_xy)

    players_xy = players_detections.get_anchors_coordinates(sv.Position.BOTTOM_CENTER)
    pitch_players_xy = transformer.transform_points(points=players_xy)

    referees_xy = referees_detections.get_anchors_coordinates(sv.Position.BOTTOM_CENTER)
    pitch_referees_xy = transformer.transform_points(points=referees_xy)

    radar = draw_pitch(PITCH_CONFIG)
    radar = draw_points_on_pitch(
        config=PITCH_CONFIG,
        xy=pitch_ball_xy,
        face_color=sv.Color.WHITE,
        edge_color=sv.Color.BLACK,
        radius=10,
        pitch=radar,
    )
    radar = draw_points_on_pitch(
        config=PITCH_CONFIG,
        xy=pitch_players_xy[players_detections.class_id == 0],
        face_color=sv.Color.from_hex("00BFFF"),
        edge_color=sv.Color.BLACK,
        radius=16,
        pitch=radar,
    )
    radar = draw_points_on_pitch(
        config=PITCH_CONFIG,
        xy=pitch_players_xy[players_detections.class_id == 1],
        face_color=sv.Color.from_hex("FF1493"),
        edge_color=sv.Color.BLACK,
        radius=16,
        pitch=radar,
    )
    radar = draw_points_on_pitch(
        config=PITCH_CONFIG,
        xy=pitch_referees_xy,
        face_color=sv.Color.from_hex("FFD700"),
        edge_color=sv.Color.BLACK,
        radius=16,
        pitch=radar,
    )
    radar_path = os.path.join(out_dir, "radar_view.png")
    save_image(radar_path, radar)

    vor = draw_pitch(PITCH_CONFIG)
    vor = draw_pitch_voronoi_diagram(
        config=PITCH_CONFIG,
        team_1_xy=pitch_players_xy[players_detections.class_id == 0],
        team_2_xy=pitch_players_xy[players_detections.class_id == 1],
        team_1_color=sv.Color.from_hex("00BFFF"),
        team_2_color=sv.Color.from_hex("FF1493"),
        pitch=vor,
    )
    vor_path = os.path.join(out_dir, "voronoi.png")
    save_image(vor_path, vor)

    blended = draw_pitch(
        config=PITCH_CONFIG, background_color=sv.Color.WHITE, line_color=sv.Color.BLACK
    )
    blended = draw_pitch_voronoi_diagram_2(
        config=PITCH_CONFIG,
        team_1_xy=pitch_players_xy[players_detections.class_id == 0],
        team_2_xy=pitch_players_xy[players_detections.class_id == 1],
        team_1_color=sv.Color.from_hex("00BFFF"),
        team_2_color=sv.Color.from_hex("FF1493"),
        pitch=blended,
    )
    blended = draw_points_on_pitch(
        config=PITCH_CONFIG,
        xy=pitch_ball_xy,
        face_color=sv.Color.WHITE,
        edge_color=sv.Color.WHITE,
        radius=8,
        thickness=1,
        pitch=blended,
    )
    blended = draw_points_on_pitch(
        config=PITCH_CONFIG,
        xy=pitch_players_xy[players_detections.class_id == 0],
        face_color=sv.Color.from_hex("00BFFF"),
        edge_color=sv.Color.WHITE,
        radius=16,
        thickness=1,
        pitch=blended,
    )
    blended = draw_points_on_pitch(
        config=PITCH_CONFIG,
        xy=pitch_players_xy[players_detections.class_id == 1],
        face_color=sv.Color.from_hex("FF1493"),
        edge_color=sv.Color.WHITE,
        radius=16,
        thickness=1,
        pitch=blended,
    )
    blended_path = os.path.join(out_dir, "voronoi_blended.png")
    save_image(blended_path, blended)

    return {
        "frame_advanced": annotated_path,
        "radar": radar_path,
        "voronoi": vor_path,
        "voronoi_blended": blended_path,
    }
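
# step_single_frame_advanced mirrors the per-frame logic of the full analysis
# pass: team assignment via TEAM_CLASSIFIER, goalkeeper team resolution by
# nearest team centroid, then a homography (ViewTransformer) from detected
# pitch keypoints to pitch coordinates for the radar and Voronoi views.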


def replace_outliers_based_on_distance(positions: List[np.ndarray], distance_threshold: float) -> List[np.ndarray]:
    last_valid_position = None
    cleaned_positions: List[np.ndarray] = []

    for position in positions:
        if len(position) == 0:
            cleaned_positions.append(position)
        else:
            if last_valid_position is None:
                cleaned_positions.append(position)
                last_valid_position = position
            else:
                distance = np.linalg.norm(position - last_valid_position)
                if distance > distance_threshold:
                    cleaned_positions.append(np.array([], dtype=np.float64))
                else:
                    cleaned_positions.append(position)
                    last_valid_position = position

    return cleaned_positions
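
# Example: SoccerPitchConfiguration coordinates are in centimeters, so with
# the 500-unit (5 m) threshold used below, a jump from [0, 0] to [10_000, 0]
# (100 m) is treated as a detector glitch and blanked out:
#   replace_outliers_based_on_distance(
#       [np.array([0.0, 0.0]), np.array([10_000.0, 0.0])], 500
#   )
#   -> [array([0., 0.]), array([], dtype=float64)]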


def step_ball_path(video_path: str, out_dir: str) -> Dict[str, Any]:
    ensure_models_loaded()

    MAXLEN = 5
    MAX_DISTANCE_THRESHOLD = 500  # pitch units (cm), i.e. 5 m

    video_info = sv.VideoInfo.from_video_path(video_path)
    frame_generator = sv.get_video_frames_generator(video_path)

    path_raw: List[np.ndarray] = []
    M = deque(maxlen=MAXLEN)

    for frame in tqdm(frame_generator, total=video_info.total_frames, desc="ball path"):
        result = PLAYER_DETECTION_MODEL.infer(frame, confidence=0.3)[0]
        detections = sv.Detections.from_inference(result)

        ball_detections = detections[detections.class_id == BALL_ID]
        ball_detections.xyxy = sv.pad_boxes(xyxy=ball_detections.xyxy, px=10)

        result = FIELD_DETECTION_MODEL.infer(frame, confidence=0.3)[0]
        key_points = sv.KeyPoints.from_inference(result)

        if len(key_points.xy) == 0:
            # No pitch keypoints detected in this frame; record an empty
            # position instead of crashing on the confidence lookup below.
            path_raw.append(np.empty((0, 2), dtype=np.float32))
            continue

        filt = key_points.confidence[0] > 0.5
        frame_reference_points = key_points.xy[0][filt]
        pitch_reference_points = np.array(PITCH_CONFIG.vertices)[filt]

        if len(frame_reference_points) < 4:
            # A homography needs at least four confident keypoints.
            path_raw.append(np.empty((0, 2), dtype=np.float32))
            continue

        transformer = ViewTransformer(
            source=frame_reference_points, target=pitch_reference_points
        )
        M.append(transformer.m)
        transformer.m = np.mean(np.array(M), axis=0)

        frame_ball_xy = ball_detections.get_anchors_coordinates(sv.Position.BOTTOM_CENTER)
        pitch_ball_xy = transformer.transform_points(points=frame_ball_xy)

        path_raw.append(pitch_ball_xy)

    # Frames with two or more ball candidates are ambiguous and are dropped
    # (replaced with an empty position).
    path = [
        np.empty((0, 2), dtype=np.float32) if coords.shape[0] >= 2 else coords
        for coords in path_raw
    ]
    path = [coords.flatten() for coords in path]

    path_clean = replace_outliers_based_on_distance(path, MAX_DISTANCE_THRESHOLD)

    raw_pitch = draw_pitch(PITCH_CONFIG)
    raw_pitch = draw_paths_on_pitch(
        config=PITCH_CONFIG, paths=[path], color=sv.Color.WHITE, pitch=raw_pitch
    )
    raw_path_img = os.path.join(out_dir, "ball_path_raw.png")
    save_image(raw_path_img, raw_pitch)

    clean_pitch = draw_pitch(PITCH_CONFIG)
    clean_pitch = draw_paths_on_pitch(
        config=PITCH_CONFIG, paths=[path_clean], color=sv.Color.WHITE, pitch=clean_pitch
    )
    cleaned_path_img = os.path.join(out_dir, "ball_path_cleaned.png")
    save_image(cleaned_path_img, clean_pitch)

    coords_clean = [
        coords.tolist() if len(coords) > 0 else [] for coords in path_clean
    ]

    return {
        "ball_path_raw_img": raw_path_img,
        "ball_path_cleaned_img": cleaned_path_img,
        "ball_path_cleaned_coords": coords_clean,
    }
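
# Note: step_ball_path averages the last MAXLEN homographies (the `M` deque)
# before projecting the ball, which damps frame-to-frame jitter in the
# estimated pitch transform at the cost of a few frames of lag.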


def step_analyze_and_annotate_video(video_path: str, out_dir: str) -> Dict[str, Any]:
    """
    Single pass over the video that:
      * tracks players & ball
      * computes distance & speed per player (pitch coordinates)
      * estimates ball possession per team & per player
      * estimates time spent in defensive/middle/attacking thirds
      * detects simple events:
          - passes (successful, between teammates)
          - tackles / interceptions (winning the ball from an opponent)
          - clearances
          - shots (high-speed ball towards goal)
      * renders an annotated MP4 with overlays:
          - per-player labels: id, team, speed, distance
          - possession HUD per team
          - event banners
    """
    ensure_models_loaded()
    os.makedirs(out_dir, exist_ok=True)

    video_info = sv.VideoInfo.from_video_path(video_path)
    fps = video_info.fps
    dt = 1.0 / max(fps, 1.0)

    # SoccerPitchConfiguration dimensions are in centimeters, so pitch-space
    # distances are divided by CM_PER_M before being reported in meters.
    CM_PER_M = 100.0

    tracker = sv.ByteTrack()
    tracker.reset()

    Ms = deque(maxlen=5)

    distance_covered_m = defaultdict(float)
    possession_time_player = defaultdict(float)
    possession_time_team = defaultdict(float)
    team_of_player: Dict[int, int] = {}

    player_stats: Dict[int, Dict[str, Any]] = defaultdict(
        lambda: {
            "distance_m": 0.0,
            "max_speed_kmh": 0.0,
            "time_def_third_s": 0.0,
            "time_mid_third_s": 0.0,
            "time_att_third_s": 0.0,
            "touches": 0,
            "successful_passes": 0,
            "received_passes": 0,
            "shots": 0,
            "tackles": 0,
            "interceptions": 0,
            "clearances": 0,
        }
    )

    events: List[Dict[str, Any]] = []

    prev_positions: Dict[int, np.ndarray] = {}
    prev_owner_tid: Optional[int] = None
    prev_ball_pos_pitch: Optional[np.ndarray] = None

    goal_centers = {
        0: np.array([0.0, PITCH_CONFIG.width / 2.0]),
        1: np.array([PITCH_CONFIG.length, PITCH_CONFIG.width / 2.0]),
    }
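
    # Team 0 is assumed to attack the goal at x = length and team 1 the goal
    # at x = 0 (a shot by team t is aimed at goal_centers[1 - t]); this is a
    # heuristic and may be flipped for a given clip.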

    ellipse_annotator = sv.EllipseAnnotator(
        color=sv.ColorPalette.from_hex(["#00BFFF", "#FF1493", "#FFD700"]),
        thickness=2,
    )
    label_annotator = sv.LabelAnnotator(
        color=sv.ColorPalette.from_hex(["#00BFFF", "#FF1493", "#FFD700"]),
        text_color=sv.Color.from_hex("#000000"),
        text_position=sv.Position.BOTTOM_CENTER,
    )
    triangle_annotator = sv.TriangleAnnotator(
        color=sv.Color.from_hex("#FFD700"), base=25, height=21, outline_thickness=1
    )

    sink_path = os.path.join(out_dir, "annotated_events.mp4")
    sink = sv.VideoSink(sink_path, video_info)

    current_event_text = ""
    event_text_frames_left = 0
    EVENT_TEXT_DURATION_S = 2.0
    EVENT_TEXT_DURATION_FRAMES = int(EVENT_TEXT_DURATION_S * fps)

    frame_generator = sv.get_video_frames_generator(video_path)

    with sink:
        for frame_idx, frame in enumerate(
            tqdm(frame_generator, total=video_info.total_frames, desc="analyze + annotate")
        ):
            t = frame_idx * dt

            det_result = PLAYER_DETECTION_MODEL.infer(frame, confidence=0.3)[0]
            detections = sv.Detections.from_inference(det_result)

            ball_dets = detections[detections.class_id == BALL_ID]
            ball_dets.xyxy = sv.pad_boxes(xyxy=ball_dets.xyxy, px=10)

            non_ball = detections[detections.class_id != BALL_ID]
            non_ball = non_ball.with_nms(threshold=0.5, class_agnostic=True)
            tracked = tracker.update_with_detections(non_ball)

            goalkeepers_dets = tracked[tracked.class_id == GOALKEEPER_ID]
            players_dets = tracked[tracked.class_id == PLAYER_ID]
            referees_dets = tracked[tracked.class_id == REFEREE_ID]

            field_result = FIELD_DETECTION_MODEL.infer(frame, confidence=0.3)[0]
            key_points = sv.KeyPoints.from_inference(field_result)
            if len(key_points.xy) == 0:
                frame_ref = np.empty((0, 2), dtype=np.float32)
                pitch_ref = np.empty((0, 2), dtype=np.float32)
            else:
                filt = key_points.confidence[0] > 0.5
                frame_ref = key_points.xy[0][filt]
                pitch_ref = np.array(PITCH_CONFIG.vertices)[filt]

            if len(frame_ref) < 4:
                # Not enough keypoints for a homography; annotate in image
                # space only and skip the pitch-based analysis for this frame.
                annotated = frame.copy()
                annotated = ellipse_annotator.annotate(scene=annotated, detections=players_dets)
                annotated = triangle_annotator.annotate(scene=annotated, detections=ball_dets)
                sink.write_frame(annotated)
                continue

            transformer = ViewTransformer(source=frame_ref, target=pitch_ref)
            Ms.append(transformer.m)
            transformer.m = np.mean(np.array(Ms), axis=0)

            frame_players_xy_pitch = None
            frame_ball_pos_pitch = None
            current_positions: Dict[int, np.ndarray] = {}
            current_speed_kmh: Dict[int, float] = {}

            if len(players_dets) > 0:
                crops = [sv.crop_image(frame, xyxy) for xyxy in players_dets.xyxy]
                team_preds = TEAM_CLASSIFIER.predict(crops)
                players_dets.class_id = team_preds

                frame_players_xy_img = players_dets.get_anchors_coordinates(
                    sv.Position.BOTTOM_CENTER
                )
                frame_players_xy_pitch = transformer.transform_points(
                    points=frame_players_xy_img
                )

                pitch_length = PITCH_CONFIG.length

                for tid, team_id, pos_pitch in zip(
                    players_dets.tracker_id, players_dets.class_id, frame_players_xy_pitch
                ):
                    tid_int = int(tid)
                    team_of_player[tid_int] = int(team_id)
                    current_positions[tid_int] = pos_pitch

                    prev_pos = prev_positions.get(tid_int)
                    speed_kmh = 0.0
                    if prev_pos is not None:
                        # Pitch coordinates are centimeters; convert to meters.
                        dist_m = float(np.linalg.norm(pos_pitch - prev_pos)) / CM_PER_M
                        distance_covered_m[tid_int] += dist_m
                        player_stats[tid_int]["distance_m"] += dist_m
                        speed_kmh = (dist_m / dt) * 3.6
                        player_stats[tid_int]["max_speed_kmh"] = max(
                            player_stats[tid_int]["max_speed_kmh"], speed_kmh
                        )
                    current_speed_kmh[tid_int] = speed_kmh

                    x_pos = pos_pitch[0]
                    if x_pos < pitch_length / 3.0:
                        player_stats[tid_int]["time_def_third_s"] += dt
                    elif x_pos < 2.0 * pitch_length / 3.0:
                        player_stats[tid_int]["time_mid_third_s"] += dt
                    else:
                        player_stats[tid_int]["time_att_third_s"] += dt

            if len(ball_dets) > 0:
                frame_ball_xy_img = ball_dets.get_anchors_coordinates(
                    sv.Position.BOTTOM_CENTER
                )
                frame_ball_xy_pitch = transformer.transform_points(points=frame_ball_xy_img)
                frame_ball_pos_pitch = frame_ball_xy_pitch[0]

            owner_tid: Optional[int] = None
            POSSESSION_RADIUS_M = 5.0

            if frame_ball_pos_pitch is not None and frame_players_xy_pitch is not None:
                dists_m = (
                    np.linalg.norm(frame_players_xy_pitch - frame_ball_pos_pitch, axis=1)
                    / CM_PER_M
                )
                j = int(np.argmin(dists_m))
                if dists_m[j] < POSSESSION_RADIUS_M:
                    owner_tid = int(players_dets.tracker_id[j])

            if owner_tid is not None:
                possession_time_player[owner_tid] += dt
                owner_team = team_of_player.get(owner_tid)
                if owner_team is not None:
                    possession_time_team[owner_team] += dt

            def register_event(ev: Dict[str, Any], text: str):
                nonlocal current_event_text, event_text_frames_left
                events.append(ev)
                if text:
                    current_event_text = text
                    event_text_frames_left = EVENT_TEXT_DURATION_FRAMES

            if owner_tid != prev_owner_tid:
                if owner_tid is not None:
                    player_stats[owner_tid]["touches"] += 1

                if owner_tid is not None and prev_owner_tid is not None:
                    prev_team = team_of_player.get(prev_owner_tid)
                    cur_team = team_of_player.get(owner_tid)

                    travel_m = 0.0
                    if prev_ball_pos_pitch is not None and frame_ball_pos_pitch is not None:
                        travel_m = (
                            float(np.linalg.norm(frame_ball_pos_pitch - prev_ball_pos_pitch))
                            / CM_PER_M
                        )

                    MIN_PASS_TRAVEL_M = 3.0

                    if prev_team is not None and cur_team is not None:
                        if prev_team == cur_team and travel_m > MIN_PASS_TRAVEL_M:
                            register_event(
                                {
                                    "type": "pass",
                                    "t": float(t),
                                    "from_tid": int(prev_owner_tid),
                                    "to_tid": int(owner_tid),
                                    "team_id": int(cur_team),
                                    "extra": {"distance_m": travel_m},
                                },
                                f"Pass: #{prev_owner_tid} → #{owner_tid} (Team {cur_team})",
                            )
                            player_stats[prev_owner_tid]["successful_passes"] += 1
                            player_stats[owner_tid]["received_passes"] += 1
                        elif prev_team != cur_team:
                            # Distance between the two players decides tackle
                            # vs. interception.
                            d_pp = 999.0
                            pos_prev = prev_positions.get(int(prev_owner_tid))
                            pos_cur = current_positions.get(int(owner_tid))
                            if pos_prev is not None and pos_cur is not None:
                                d_pp = float(np.linalg.norm(pos_prev - pos_cur)) / CM_PER_M
                            ev_type = "tackle" if d_pp < 3.0 else "interception"
                            label = "Tackle" if ev_type == "tackle" else "Interception"
                            register_event(
                                {
                                    "type": ev_type,
                                    "t": float(t),
                                    "from_tid": int(prev_owner_tid),
                                    "to_tid": int(owner_tid),
                                    "team_id": int(cur_team),
                                    "extra": {
                                        "player_distance_m": d_pp,
                                        "ball_travel_m": travel_m,
                                    },
                                },
                                f"{label}: #{owner_tid} wins ball from #{prev_owner_tid}",
                            )
                            if ev_type == "tackle":
                                player_stats[owner_tid]["tackles"] += 1
                            else:
                                player_stats[owner_tid]["interceptions"] += 1

                # Always record the raw possession change as well.
                register_event(
                    {
                        "type": "possession_change",
                        "t": float(t),
                        "from_tid": int(prev_owner_tid) if prev_owner_tid is not None else None,
                        "to_tid": int(owner_tid) if owner_tid is not None else None,
                        "team_id": int(team_of_player.get(owner_tid))
                        if owner_tid is not None
                        else None,
                        "extra": {},
                    },
                    "" if owner_tid is None else f"Team {team_of_player.get(owner_tid)} in possession",
                )

            if (
                prev_ball_pos_pitch is not None
                and frame_ball_pos_pitch is not None
                and owner_tid is not None
            ):
                v = (frame_ball_pos_pitch - prev_ball_pos_pitch) / dt
                speed_mps = float(np.linalg.norm(v)) / CM_PER_M
                speed_kmh = speed_mps * 3.6
                HIGH_SPEED_KMH = 18.0

                if speed_kmh > HIGH_SPEED_KMH:
                    shooter_team = team_of_player.get(owner_tid)
                    if shooter_team is not None:
                        target_goal = goal_centers[1 - shooter_team]
                        direction = target_goal - frame_ball_pos_pitch
                        cos_angle = float(
                            np.dot(v, direction)
                            / (np.linalg.norm(v) * np.linalg.norm(direction) + 1e-6)
                        )

                        if cos_angle > 0.8:
                            register_event(
                                {
                                    "type": "shot",
                                    "t": float(t),
                                    "from_tid": int(owner_tid),
                                    "to_tid": None,
                                    "team_id": int(shooter_team),
                                    "extra": {"speed_kmh": speed_kmh},
                                },
                                f"Shot by #{owner_tid} (Team {shooter_team}) – {speed_kmh:.1f} km/h",
                            )
                            player_stats[owner_tid]["shots"] += 1
                        else:
                            register_event(
                                {
                                    "type": "clearance",
                                    "t": float(t),
                                    "from_tid": int(owner_tid),
                                    "to_tid": None,
                                    "team_id": int(shooter_team),
                                    "extra": {"speed_kmh": speed_kmh},
                                },
                                f"Clearance by #{owner_tid} (Team {shooter_team})",
                            )
                            player_stats[owner_tid]["clearances"] += 1

            prev_owner_tid = owner_tid
            prev_ball_pos_pitch = frame_ball_pos_pitch
            prev_positions = current_positions

            annotated = frame.copy()

            player_labels: List[str] = []
            if frame_players_xy_pitch is not None and len(players_dets) > 0:
                for tid, pos_pitch in zip(players_dets.tracker_id, frame_players_xy_pitch):
                    tid_int = int(tid)
                    team_id = team_of_player.get(tid_int, -1)
                    speed_kmh = current_speed_kmh.get(tid_int, 0.0)
                    d_total = distance_covered_m[tid_int]
                    player_labels.append(
                        f"#{tid_int} T{team_id} {speed_kmh:4.1f} km/h {d_total:.1f} m"
                    )

                annotated = ellipse_annotator.annotate(
                    scene=annotated, detections=players_dets
                )
                annotated = label_annotator.annotate(
                    scene=annotated, detections=players_dets, labels=player_labels
                )

            annotated = triangle_annotator.annotate(scene=annotated, detections=ball_dets)

            # The +1e-6 keeps the denominator positive before any possession
            # has been accrued.
            total_poss_time = sum(possession_time_team.values()) + 1e-6
            team0_pct = 100.0 * possession_time_team.get(0, 0.0) / total_poss_time
            team1_pct = 100.0 * possession_time_team.get(1, 0.0) / total_poss_time

            hud_text = (
                f"Team 0 Ball Control: {team0_pct:5.2f}% "
                f"Team 1 Ball Control: {team1_pct:5.2f}%"
            )
            cv2.rectangle(
                annotated,
                (20, annotated.shape[0] - 60),
                (annotated.shape[1] - 20, annotated.shape[0] - 20),
                (255, 255, 255),
                -1,
            )
            cv2.putText(
                annotated,
                hud_text,
                (30, annotated.shape[0] - 30),
                cv2.FONT_HERSHEY_SIMPLEX,
                0.8,
                (0, 0, 0),
                2,
                cv2.LINE_AA,
            )

            if event_text_frames_left > 0 and current_event_text:
                cv2.rectangle(
                    annotated, (20, 20), (annotated.shape[1] - 20, 90), (255, 255, 255), -1
                )
                cv2.putText(
                    annotated,
                    current_event_text,
                    (30, 70),
                    cv2.FONT_HERSHEY_SIMPLEX,
                    1.0,
                    (0, 0, 0),
                    2,
                    cv2.LINE_AA,
                )
                event_text_frames_left -= 1

            sink.write_frame(annotated)

    total_poss = sum(possession_time_team.values()) + 1e-6
    possession_percent_team = {
        int(team): 100.0 * t_sec / total_poss for team, t_sec in possession_time_team.items()
    }

    stats = {
        "distance_covered_m": {str(tid): float(d) for tid, d in distance_covered_m.items()},
        "possession_time_player_s": {
            str(tid): float(t_sec) for tid, t_sec in possession_time_player.items()
        },
        "possession_time_team_s": {
            int(team): float(t_sec) for team, t_sec in possession_time_team.items()
        },
        "possession_percent_team": possession_percent_team,
        "team_of_player": {str(tid): int(team) for tid, team in team_of_player.items()},
        "player_stats": {
            str(tid): {
                k: float(v) if isinstance(v, (int, float)) else v
                for k, v in stats_dict.items()
            }
            for tid, stats_dict in player_stats.items()
        },
    }

    return {
        "annotated_video": sink_path,
        "stats": stats,
        "events": events,
    }


def run_full_pipeline(video_path: str, job_dir: str) -> Dict[str, Any]:
    """
    Run the full notebook-equivalent pipeline on a video and save all artifacts
    into job_dir. Returns paths + stats for the FastAPI app.
    """
    set_job_dir(job_dir)
    update_progress("initializing", 0.0, "Loading models...")
    ensure_models_loaded()

    os.makedirs(job_dir, exist_ok=True)

    update_progress("siglip", 0.10, "Running SigLIP clustering...")
    siglip_out = step_siglip_clustering(video_path, os.path.join(job_dir, "siglip"))

    update_progress("team_classifier", 0.25, "Training TeamClassifier...")
    train_team_classifier_on_video(video_path)

    update_progress("basic_frames", 0.35, "Generating basic annotated frames...")
    basic_paths = step_basic_frames(video_path, os.path.join(job_dir, "frames"))

    update_progress("advanced_views", 0.45, "Generating advanced radar / Voronoi views...")
    adv_paths = step_single_frame_advanced(video_path, os.path.join(job_dir, "advanced"))

    update_progress("ball_path", 0.60, "Computing ball path...")
    ball_paths = step_ball_path(video_path, os.path.join(job_dir, "ball_path"))

    update_progress(
        "events_video",
        0.80,
        "Analyzing match, computing speed/distance, and rendering event-annotated video...",
    )
    analysis_out = step_analyze_and_annotate_video(
        video_path, os.path.join(job_dir, "analysis")
    )

    result = {
        "basic": basic_paths,
        "advanced": adv_paths,
        "ball": ball_paths,
        "stats": analysis_out["stats"],
        "events": analysis_out["events"],
        "annotated_video": analysis_out["annotated_video"],
        "siglip_html": siglip_out["plot_html"],
    }

    result_path = os.path.join(job_dir, "result.json")
    with open(result_path, "w", encoding="utf-8") as f:
        json.dump(result, f)

    update_progress("done", 1.0, "Completed")

    return result
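

if __name__ == "__main__":
    # Minimal local smoke test (a sketch: assumes a short clip at ./demo.mp4
    # and a ROBOFLOW_API_KEY in the environment); the FastAPI app normally
    # drives run_full_pipeline() instead. The file name and job dir here are
    # illustrative only.
    out = run_full_pipeline("demo.mp4", "jobs/demo")
    print("annotated video:", out["annotated_video"])
    print("events detected:", len(out["events"]))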