Spaces:

2nzi
/

PnLCalib

Running

App Files Files Community

PnLCalib / static_calibration.py

2nzi

Upload 63 files

3d1f2c9 13 days ago

raw

history blame contribute delete

17.9 kB

	from utils.utils_keypoints import KeypointsDB
	from utils.utils_lines import LineKeypointsDB
	from utils.utils_calib import FramebyFrameCalib
	from utils.utils_heatmap import complete_keypoints
	from PIL import Image
	import torch
	import numpy as np
	import matplotlib.pyplot as plt
	from matplotlib.lines import Line2D


	# Pitch-marking annotations for the "cam3" view.
	# Each key is the name of a pitch line or arc; each value is an ordered list of
	# {"x", "y"} points lying on that marking.
	# Coordinates look like pixel positions (x up to ~1919, y up to ~1077, so
	# presumably a 1920x1080 frame -- TODO confirm); main() divides them by the
	# image width/height through transform_data() before use.
	cam3_line_dict = {

	"Big rect. right top": [
	{"x": 1342.8861505076343, "y": 1076.997434976179},
	{"x": 1484.7446330310781, "y": 906.3705391217808}
	],
	"Big rect. right main": [
	{"x": 1484.7446330310781, "y": 906.3705391217808},
	{"x": 1049.6210183678218, "y": 748.0287797688992},
	{"x": 828.6491513601493, "y": 668.8579000924583},
	{"x": 349.8767728435256, "y": 500.9610345717304},
	{"x": 32.736572890025556, "y": 397.21988189225624}
	],
	"Big rect. right bottom": [
	{"x": 32.736572890025556, "y": 397.21988189225624},
	{"x": 0.3753980224568448, "y": 407.0286292126068}
	],
	"Small rect. right top": [
	{"x": 312.24913494809687, "y": 1075.6461846681693},
	{"x": 426.66666666666663, "y": 999.9279904137233}
	],
	"Small rect. right main": [
	{"x": 426.66666666666663, "y": 999.9279904137233},
	{"x": 0, "y": 769.079837198949}
	],
	# First and last points coincide with points of "Big rect. right main".
	"Circle right": [
	{"x": 828.6491513601493, "y": 668.8579000924583},
	{"x": 821.7759602949911, "y": 612.2830792373484},
	{"x": 782.8739995106773, "y": 564.5621490047902},
	{"x": 722.6387053930304, "y": 529.3993583071158},
	{"x": 623.5014504910696, "y": 503.02726528386006},
	{"x": 494.24654853028534, "y": 492.980753655953},
	{"x": 349.8767728435256, "y": 500.9610345717304}
	],
	"Side line bottom": [
	{"x": 2.0193824656299317, "y": 266.2605192109321},
	{"x": 399.0443993689428, "y": 186.14824976426013},
	{"x": 645.5533017804819, "y": 132.93313314748357},
	{"x": 1001.1088573360372, "y": 53.39824942655338},
	{"x": 1208.1676808654488, "y": 7.351737798646435}
	],
	"Middle line": [
	{"x": 645.5533017804819, "y": 132.93313314748357},
	{"x": 1106.0585089650835, "y": 200.22939899146556},
	{"x": 1580.7388158704541, "y": 269.8451725000601},
	{"x": 1917.6527118636336, "y": 318.9857185061268}
	],
	# NOTE(review): the first point below is listed twice in a row and once more as
	# the closing point -- confirm the back-to-back duplicate is intentional.
	"Circle central": [
	{"x": 1580.7388158704541, "y": 269.8451725000601},
	{"x": 1580.7388158704541, "y": 269.8451725000601},
	{"x": 1533.8366024891266, "y": 288.8643838246303},
	{"x": 1441.810458698277, "y": 302.46903498742097},
	{"x": 1316.3202626198458, "y": 304.5620582432349},
	{"x": 1219.0653606590615, "y": 292.0039187083512},
	{"x": 1135.4052299401073, "y": 274.2132210339326},
	{"x": 1069.522876998931, "y": 237.5853140571884},
	{"x": 1106.0585089650835, "y": 200.22939899146556},
	{"x": 1139.5882364760548, "y": 189.4457791734675},
	{"x": 1224.2941188289963, "y": 177.9341512664908},
	{"x": 1314.2287593518718, "y": 174.79461638276985},
	{"x": 1392.6601319008914, "y": 180.02717452230473},
	{"x": 1465.8627462799764, "y": 190.49229080137454},
	{"x": 1529.6535959531789, "y": 204.09694196416518},
	{"x": 1581.9411776525253, "y": 230.2597326618396},
	{"x": 1580.7388158704541, "y": 269.8451725000601}
	],
	"Side line left": [
	{"x": 1208.1676808654488, "y": 7.351737798646435},
	{"x": 1401.9652021886754, "y": 20.565213248502545},
	{"x": 1582.3573590514204, "y": 30.37625976013045},
	{"x": 1679.416182580832, "y": 34.300678364781604},
	{"x": 1824.5142217965183, "y": 41.23091697692868},
	{"x": 1918.6318688553417, "y": 42.21202162809147}
	],
	"Big rect. left bottom": [
	{"x": 1401.9652021886754, "y": 20.565213248502545},
	{"x": 1283.3377512082834, "y": 53.98527744204496}
	],
	"Big rect. left main": [
	{"x": 1283.3377512082834, "y": 53.98527744204496},
	{"x": 1510.7887316004399, "y": 73.60737046530076},
	{"x": 1808.8279472867146, "y": 94.21056813971936},
	{"x": 1918.6318688553417, "y": 100.0971960466961}
	],
	# First and last points coincide with points of "Big rect. left main".
	"Circle left": [
	{"x": 1510.7887316004399, "y": 73.60737046530076},
	{"x": 1548.0436335612244, "y": 86.36173093041702},
	{"x": 1620.5926531690673, "y": 95.19167279088215},
	{"x": 1681.3769668945574, "y": 97.15388209320773},
	{"x": 1746.0828492474989, "y": 100.0971960466961},
	{"x": 1808.8279472867146, "y": 94.21056813971936}
	],
	"Small rect. left bottom": [
	{"x": 1550.9848100318127, "y": 42.21202162809147},
	{"x": 1582.3573590514204, "y": 30.37625976013045}
	],
	"Small rect. left main": [
	{"x": 1550.9848100318127, "y": 42.21202162809147},
	{"x": 1918.418689198772, "y": 60.49417894940041}
	]
	}

	def transform_data(line_dict, width, height):
	    """
	    Rescale every annotated point from image units to fractions of the image size.

	    Args:
	        line_dict (dict): Maps a line name to a list of {"x": ..., "y": ...} points
	        width (int): Image width; divisor applied to every "x" value
	        height (int): Image height; divisor applied to every "y" value

	    Returns:
	        dict: New dictionary with the same line names and point order, where each
	            point holds x / width and y / height. The input is not modified.
	    """
	    def _scaled(pt):
	        # One normalized copy of a single point
	        return {"x": pt["x"] / width, "y": pt["y"] / height}

	    return {
	        name: [_scaled(pt) for pt in pts]
	        for name, pts in line_dict.items()
	    }



	def _image_to_world(point_2d, cam_params):
	    """
	    Back-project an image point onto the ground plane Z = 0.

	    Uses the pinhole model x ~ K @ R @ (X - C), with K built from the focal
	    lengths and principal point, R the rotation matrix and C the camera position
	    taken from cam_params["cam_params"].

	    Args:
	        point_2d (sequence): Image coordinates (x, y) of the point
	        cam_params (dict): Dictionary containing camera parameters

	    Returns:
	        numpy.ndarray or None: World (X, Y) where the viewing ray meets Z = 0, or
	            None when the ray is parallel to the ground or only meets it behind
	            the camera (no meaningful position on the field exists then).
	    """
	    params = cam_params["cam_params"]
	    K = np.array([
	        [params["x_focal_length"], 0, params["principal_point"][0]],
	        [0, params["y_focal_length"], params["principal_point"][1]],
	        [0, 0, 1]
	    ])
	    R = np.array(params["rotation_matrix"])
	    camera_pos = np.array(params["position_meters"])

	    # Direction of the viewing ray through this pixel, in world coordinates
	    point_2d_h = np.array([point_2d[0], point_2d[1], 1])
	    ray = R.T @ (np.linalg.inv(K) @ point_2d_h)

	    # A ray parallel to the ground never reaches Z = 0 (avoids dividing by zero)
	    if abs(ray[2]) < 1e-12:
	        return None

	    # camera_pos + depth * ray has Z = 0; depth is the distance along the optical
	    # axis, so a non-positive value means the intersection is behind the camera
	    depth = -camera_pos[2] / ray[2]
	    if depth <= 0:
	        return None

	    return (camera_pos + depth * ray)[:2]


	def plot_camera_position(cam_params, keypoints_dict=None, lines_dict=None):
	    """
	    Plot the camera position, orientation and points relative to the football field.

	    Draws a 3D scene with the field outline, midline, penalty areas and center
	    circle, the camera with a small image-plane rectangle and its view direction,
	    and optionally the keypoints / line end points projected onto the ground
	    plane. The figure is displayed with plt.show().

	    Args:
	        cam_params (dict): Dictionary containing camera parameters; reads
	            cam_params["cam_params"] keys "position_meters", "rotation_matrix",
	            "x_focal_length", "y_focal_length" and "principal_point"
	        keypoints_dict (dict, optional): Keypoint id -> mapping with 'x' and 'y'
	            image coordinates
	        lines_dict (dict, optional): Line id -> mapping with 'x_1', 'y_1', 'x_2',
	            'y_2' image coordinates

	    Returns:
	        None
	    """
	    # Field dimensions in meters
	    field_length = 105
	    field_width = 68
	    half_length = field_length / 2
	    half_width = field_width / 2
	    penalty_depth = 16.5
	    penalty_half_width = 20.16

	    # Get camera parameters
	    params = cam_params["cam_params"]
	    camera_pos = np.array(params["position_meters"])
	    R = np.array(params["rotation_matrix"])

	    # Create 3D figure
	    fig = plt.figure(figsize=(12, 8))
	    ax = fig.add_subplot(111, projection='3d')

	    # Draw main field (closed outline, first corner repeated at the end)
	    field_corners = np.array([
	        [-half_length, -half_width, 0],
	        [half_length, -half_width, 0],
	        [half_length, half_width, 0],
	        [-half_length, half_width, 0],
	        [-half_length, -half_width, 0]
	    ])
	    ax.plot(field_corners[:, 0], field_corners[:, 1], field_corners[:, 2], 'g-')

	    # Add midline
	    ax.plot([0, 0], [-half_width, half_width], [0, 0], 'w--')

	    # Add penalty areas: side = -1 is the left one, side = +1 the right one
	    for side in (-1, 1):
	        goal_x = side * half_length
	        box_x = side * (half_length - penalty_depth)
	        ax.plot([goal_x, box_x], [-penalty_half_width, -penalty_half_width], [0, 0], 'r-', linewidth=2)
	        ax.plot([goal_x, box_x], [penalty_half_width, penalty_half_width], [0, 0], 'r-', linewidth=2)
	        ax.plot([box_x, box_x], [-penalty_half_width, penalty_half_width], [0, 0], 'r-', linewidth=2)

	    # Add center circle
	    theta = np.linspace(0, 2*np.pi, 100)
	    radius = 9.15
	    ax.plot(radius * np.cos(theta), radius * np.sin(theta), np.zeros_like(theta), 'y-')

	    # Plot camera position
	    ax.scatter(camera_pos[0], camera_pos[1], camera_pos[2], color='red', s=100)

	    # Draw image plane: a 16 x 9 rectangle placed 2 units in front of the camera,
	    # defined in camera coordinates and rotated into world coordinates with R.T
	    rect_width = 16
	    rect_height = 9
	    corners_cam = np.array([
	        [-rect_width/2, -rect_height/2, 2],
	        [rect_width/2, -rect_height/2, 2],
	        [rect_width/2, rect_height/2, 2],
	        [-rect_width/2, rect_height/2, 2],
	        [-rect_width/2, -rect_height/2, 2]
	    ])
	    corners_world = np.array([camera_pos + R.T @ corner for corner in corners_cam])
	    ax.plot(corners_world[:, 0], corners_world[:, 1], corners_world[:, 2],
	            'magenta', linewidth=2)

	    # Draw lines from camera to image plane corners (last corner repeats the first)
	    for corner in corners_world[:-1]:
	        ax.plot([camera_pos[0], corner[0]],
	                [camera_pos[1], corner[1]],
	                [camera_pos[2], corner[2]],
	                'y--', alpha=0.5)

	    # Draw view direction: third row of R, i.e. R.T @ [0, 0, 1], scaled by 10
	    direction = R[2] * 10
	    ax.quiver(camera_pos[0], camera_pos[1], camera_pos[2],
	              direction[0], direction[1], direction[2],
	              color='blue')

	    # Set labels and title
	    ax.set_xlabel('X (meters)')
	    ax.set_ylabel('Y (meters)')
	    ax.set_zlabel('Z (meters)')
	    ax.set_title('Camera position relative to field')

	    # Axis limits span 105 x 68 x 40; using the same numbers as box proportions
	    # gives every axis the same scale
	    ax.set_xlim([-half_length, half_length])
	    ax.set_ylim([-half_width, half_width])
	    ax.set_zlim([-30, 10])
	    ax.set_box_aspect([field_length, field_width, 40])

	    # Add grid
	    ax.grid(True)

	    # Add goal annotations
	    ax.text(-half_length, 0, 0, 'Left Goal', color='black')
	    ax.text(half_length, 0, 0, 'Right Goal', color='black')

	    # Calculate Euler angles in degrees from the rotation matrix
	    euler_angles = np.array([
	        np.arctan2(R[2, 1], R[2, 2]),  # roll
	        np.arctan2(-R[2, 0], np.sqrt(R[2, 1]**2 + R[2, 2]**2)),  # pitch
	        np.arctan2(R[1, 0], R[0, 0])  # yaw
	    ]) * 180 / np.pi

	    # Add camera information text
	    plt.figtext(0.02, 0.02,
	                f'Position: {camera_pos}\n'
	                f'Focal length X: {params["x_focal_length"]:.2f}\n'
	                f'Focal length Y: {params["y_focal_length"]:.2f}\n'
	                f'Rotation (deg):\n'
	                f'Roll: {euler_angles[0]:.1f}°\n'
	                f'Pitch: {euler_angles[1]:.1f}°\n'
	                f'Yaw: {euler_angles[2]:.1f}°',
	                bbox=dict(facecolor='white', alpha=0.8))

	    # Create custom legend from proxy artists. Marker entries are marker-only
	    # Line2D objects that are never added to the axes; calling plt.scatter here
	    # would draw real points at the origin of the scene.
	    legend_elements = [
	        Line2D([0], [0], color='g', label='Field'),
	        Line2D([0], [0], color='w', linestyle='--', label='Midline'),
	        Line2D([0], [0], color='y', label='Center circle'),
	        Line2D([0], [0], color='r', label='Penalty areas'),
	        Line2D([0], [0], color='magenta', label='Image plane'),
	        Line2D([0], [0], color='blue', label='View direction'),
	        Line2D([0], [0], color='y', linestyle='--', label='Projection rays'),
	        Line2D([0], [0], color='red', marker='o', linestyle='None', markersize=10, label='Camera'),
	    ]

	    # Add keypoints and lines to legend if they exist
	    if keypoints_dict is not None:
	        legend_elements.append(
	            Line2D([0], [0], color='cyan', marker='o', linestyle='None', markersize=7, label='Keypoints'))

	    if lines_dict is not None:
	        legend_elements.append(
	            Line2D([0], [0], color='magenta', marker='o', linestyle='None', markersize=7, label='Line points'))
	        legend_elements.append(Line2D([0], [0], color='m', alpha=0.5, label='Lines'))

	    # Add the legend with all elements
	    ax.legend(handles=legend_elements, loc='upper right')

	    # Plot keypoints if provided
	    if keypoints_dict is not None:
	        for kp_key, kp_value in keypoints_dict.items():
	            point_3d = _image_to_world((kp_value['x'], kp_value['y']), cam_params)
	            if point_3d is None:
	                # No ground-plane position for this pixel; nothing to draw
	                continue

	            # Plot point
	            ax.scatter(point_3d[0], point_3d[1], 0, color='cyan', s=50)
	            # Add keypoint number as text
	            ax.text(point_3d[0], point_3d[1], 0.1, str(kp_key),
	                    color='black', fontsize=8, ha='center', va='bottom')

	    # Plot lines if provided
	    if lines_dict is not None:
	        for line_value in lines_dict.values():
	            start_3d = _image_to_world((line_value['x_1'], line_value['y_1']), cam_params)
	            end_3d = _image_to_world((line_value['x_2'], line_value['y_2']), cam_params)

	            # Draw whichever end points have a ground-plane position
	            for endpoint in (start_3d, end_3d):
	                if endpoint is not None:
	                    ax.scatter(endpoint[0], endpoint[1], 0, color='magenta', s=50)

	            # The segment itself needs both end points
	            if start_3d is not None and end_3d is not None:
	                ax.plot([start_3d[0], end_3d[0]],
	                        [start_3d[1], end_3d[1]],
	                        [0, 0], 'm-', alpha=0.5)

	    plt.show()


	def plot_2d_points(image_path, keypoints_dict=None, lines_dict=None):
	    """
	    Overlay keypoints and line segments on top of the original 2D image.

	    Args:
	        image_path (str): Path to the image used as background
	        keypoints_dict (dict, optional): Keypoint id -> mapping with 'x' and 'y'
	            image coordinates; each is drawn as a cyan dot labelled with its id
	        lines_dict (dict, optional): Line id -> mapping with 'x_1', 'y_1', 'x_2',
	            'y_2' image coordinates; each is drawn as a magenta segment with dots
	            at both ends
	    """
	    # Read the background first, then open the figure and show it
	    background = plt.imread(image_path)
	    plt.figure(figsize=(15, 8))
	    plt.imshow(background)

	    # Keypoints: marker plus a small id tag offset by 10 units in x and y
	    keypoints = {} if keypoints_dict is None else keypoints_dict
	    for kp_id, kp in keypoints.items():
	        px, py = kp['x'], kp['y']
	        plt.scatter(px, py, color='cyan', s=100)
	        plt.text(px+10, py+10, str(kp_id), color='white', fontsize=8,
	                 bbox={'facecolor': 'black', 'alpha': 0.7})

	    # Lines: both end points plus the connecting segment
	    segments = {} if lines_dict is None else lines_dict
	    for seg in segments.values():
	        xa, ya, xb, yb = (seg[k] for k in ('x_1', 'y_1', 'x_2', 'y_2'))
	        xs, ys = [xa, xb], [ya, yb]
	        plt.scatter(xs, ys, color='magenta', s=100)
	        plt.plot(xs, ys, 'magenta', alpha=0.5)

	    plt.title('2D Points and Lines on Original Image')
	    plt.axis('off')
	    plt.show()


	def main():
	    """
	    Run the static calibration example end to end.

	    Loads the example image, normalizes cam3_line_dict by the image size, builds
	    keypoints and lines from it, completes the keypoints, estimates the camera
	    with FramebyFrameCalib.heuristic_voting, prints the results, and shows the
	    3D camera plot followed by the 2D overlay.
	    """
	    # One image path for everything: the annotations used below are the cam3 set,
	    # so the image that provides the dimensions and the one used for the 2D
	    # overlay must be the same cam3 frame (previously cam1.jpg was loaded here
	    # while cam3.jpg was plotted).
	    image_path = "examples/input/cam3.jpg"

	    # Load image; the context manager closes the underlying file once the pixel
	    # data and the size have been read
	    with Image.open(image_path) as image:
	        # Convert PIL Image to tensor format expected by utils (channels first)
	        image_tensor = torch.FloatTensor(np.array(image)).permute(2, 0, 1)
	        # Get actual image dimensions
	        img_width, img_height = image.size

	    # Transform data using actual image dimensions
	    trans_data1 = transform_data(cam3_line_dict, img_width, img_height)

	    # Initialize databases with transformed data and tensor image
	    kp_db = KeypointsDB(trans_data1, image_tensor)
	    ln_db = LineKeypointsDB(trans_data1, image_tensor)

	    # Get keypoints and lines
	    kp_db.get_full_keypoints()
	    ln_db.get_lines()

	    kp_dict = kp_db.keypoints_final
	    ln_dict = ln_db.lines

	    # Print number of keypoints before completion
	    print("\n=== Before Completion ===")
	    print(f"Number of keypoints: {len(kp_dict)}")

	    # Complete keypoints using actual image dimensions
	    kp_dict, ln_dict = complete_keypoints(kp_dict, ln_dict, img_width, img_height)

	    # Print number of keypoints after completion
	    print("\n=== After Completion ===")
	    print(f"Number of keypoints: {len(kp_dict)}")

	    # Print new keypoints
	    print("\n=== New Keypoints ===")
	    for kp_key, kp_value in kp_dict.items():
	        print(f"{kp_key}: {kp_value}")

	    # Initialize calibration with actual image dimensions
	    cam = FramebyFrameCalib(img_width, img_height)
	    cam.update(kp_dict, ln_dict)
	    cam_params = cam.heuristic_voting(refine_lines=True)

	    print(cam)
	    print(cam_params)

	    # Plot camera position and line points
	    plot_camera_position(cam_params, kp_dict, ln_dict)

	    # Plot 2D points on the same image the calibration was computed from
	    plot_2d_points(image_path, kp_dict, ln_dict)


	if __name__ == "__main__":
	    main()