Spaces:

samuellimabraz
/

line-follow-pid

Sleeping

line-follow-pid / line_detector.py

Implement real-time line detection application with Streamlit and OpenCV. Features include webcam input, interactive HSV color adjustment, multiple line detection algorithms (Hough, Adaptive Hough, Rotated Rectangle, Fit Ellipse, RANSAC), customizable region of interest, and confidence estimation. Includes necessary modules for color detection, line detection, and PID control.

1b7bc37 unverified 4 months ago

raw

history blame contribute delete

19 kB

	#!/usr/bin/env python3

	import cv2
	import numpy as np
	import math
	from abc import ABC, abstractmethod
	from typing import Tuple

	from color_detector import ColorDetector


	## --- Approximation Methods --- ##
	class ILineEstimationMethod(ABC):
	@staticmethod
	@abstractmethod
	def estimate(
	img_detect: np.ndarray, img_out: np.ndarray, offset: tuple, draw: bool = True
	) -> Tuple[float, float]:
	pass


	class HoughLinesP(ILineEstimationMethod):
	@staticmethod
	def estimate(
	img_detect: np.ndarray, img_out: np.ndarray, offset: tuple, draw: bool = True
	) -> Tuple[float, float]:
	"""
	Hough lines P detection method.
	Approximating a line from the probabilistic Hough transform
	together with line fitting

	Args:
	img_detect (numpy.ndarray): Image to detect lines in.
	img_out (numpy.ndarray): Image to draw detected lines on.
	offset (tuple): Offset values for drawing.
	draw (bool): Whether to draw the detected line.

	Returns:
	tuple: Tuple containing the center_x and angle of the detected line.
	"""
	lines = cv2.HoughLinesP(
	img_detect,
	rho=1,
	theta=np.pi / 180,
	threshold=70,
	minLineLength=25,
	maxLineGap=10,
	)

	angle = center_x = float("nan")

	if lines is not None and len(lines) > 0:
	points = []
	for line in lines:
	x1, y1, x2, y2 = line[0]
	x1 += offset[0]
	y1 += offset[1]
	x2 += offset[0]
	y2 += offset[1]
	points.append([x1, y1])
	points.append([x2, y2])

	points = np.array(points, dtype=np.float32)
	[vx, vy, x, y] = cv2.fitLine(points, cv2.DIST_L2, 0, 0.01, 0.01)

	center_x = x[0]

	angle = math.degrees(math.atan2(vy[0], vx[0]))
	if angle <= 0:
	angle += 90.0
	else:
	angle -= 90.0

	if draw:
	# Draw the approximated line on the image
	m = 50
	cv2.line(
	img_out,
	(int(x[0] - m * vx[0]), int(y[0] - m * vy[0])),
	(int(x[0] + m * vx[0]), int(y[0] + m * vy[0])),
	(0, 255, 0),
	2,
	)
	cv2.circle(img_out, (int(x[0]), int(y[0])), 2, (255, 0, 0), 3)

	return center_x, angle


	class RotatedRect(ILineEstimationMethod):
	@staticmethod
	def estimate(
	img_detect: np.ndarray, img_out: np.ndarray, offset: tuple, draw: bool = True
	) -> Tuple[float, float]:
	"""
	Rotated rectangle detection method.
	Approximates a rectangle of minimum area on the found contour

	Args:
	img_detect (numpy.ndarray): Image to detect rotated rectangle in.
	img_out (numpy.ndarray): Image to draw detected rotated rectangle on.
	offset (tuple): Offset values for drawing.
	draw (bool): Whether to draw the detected rotated rectangle.

	Returns:
	tuple: Tuple containing the center_x and angle of the detected rotated rectangle.
	"""

	contours, _ = cv2.findContours(
	img_detect, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE
	)
	contours = sorted(contours, key=cv2.minAreaRect)

	angle = center_x = float("nan")

	if len(contours) > 0 and cv2.contourArea(contours[0]) > 1500:
	blackbox = cv2.minAreaRect(contours[0])
	(x_min, y_min), (w_min, h_min), angle_bb = blackbox

	if angle_bb < -45:
	angle_bb = 90 + angle_bb
	if w_min < h_min and angle_bb > 0:
	angle_bb = (90 - angle_bb) * -1
	if w_min > h_min and angle_bb < 0:
	angle_bb = 90 + angle_bb

	if angle_bb <= 0:
	angle = angle_bb + 90.0
	else:
	angle = angle_bb - 90.0

	blackbox = (x_min + offset[0], y_min + offset[1]), (w_min, h_min), angle_bb
	box = cv2.boxPoints(blackbox)
	box = np.intp(box)

	theta = np.radians(angle_bb)
	x1 = int(x_min - 100 * np.cos(theta)) + offset[0]
	y1 = int(y_min - 100 * np.sin(theta)) + offset[1]
	x2 = int(x_min + 100 * np.cos(theta)) + offset[0]
	y2 = int(y_min + 100 * np.sin(theta)) + offset[1]

	center = (int(x_min + offset[0]), int(y_min + offset[1]))
	center_x = center[0]

	if draw:
	cv2.line(img_out, (x1, y1), (x2, y2), (255, 0, 0), 3)
	cv2.circle(img_out, center, 2, (0, 255, 0), 3)

	return center_x, angle


	class FitEllipse(ILineEstimationMethod):
	@staticmethod
	def estimate(
	img_detect: np.ndarray, img_out: np.ndarray, offset: tuple, draw: bool = True
	) -> Tuple[float, float]:
	"""
	Ellipse fitting detection method.
	Fits an ellipse to the detected contour

	Args:
	img_detect (numpy.ndarray): Image to detect ellipse in.
	img_out (numpy.ndarray): Image to draw detected ellipse on.
	offset (tuple): Offset values for drawing.
	draw (bool): Whether to draw the detected ellipse.

	Returns:
	tuple: Tuple containing the center_x and angle of the detected ellipse.
	"""

	_, img_detect = cv2.threshold(img_detect, 1, 255, cv2.THRESH_BINARY)
	contours, _ = cv2.findContours(
	img_detect, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE
	)

	angle = center_x = float("nan")
	direction = curvature = None

	if len(contours) > 0:
	rope_contour = max(contours, key=cv2.contourArea)
	if cv2.contourArea(rope_contour) > 2000:
	M = cv2.moments(rope_contour)
	center_x = int(M["m10"] / M["m00"])
	epsilon = 0.006 * cv2.arcLength(rope_contour, True)
	approx_contour = cv2.approxPolyDP(rope_contour, epsilon, True)

	if len(approx_contour) >= 5:
	ellipse = cv2.fitEllipse(approx_contour)
	(xc, yc), (d1, d2), angle = ellipse
	xc += offset[0]
	yc += offset[1]
	direction = np.sign(d2 - d1)
	curvature = np.abs(d1 - d2) / max(d1, d2)

	if draw:
	# Draw the ellipse on the image
	cv2.ellipse(img_out, ((xc, yc), (d1, d2), angle), (0, 255, 0), 2)

	return center_x, angle


	class AdaptiveHoughLinesP(ILineEstimationMethod):
	@staticmethod
	def estimate(
	img_detect: np.ndarray, img_out: np.ndarray, offset: tuple, draw: bool = True
	) -> Tuple[float, float]:
	"""
	Adaptive Hough lines detection with parameter tuning based on image characteristics.

	This method dynamically adjusts Hough transform parameters based on the image content,
	which can improve line detection in varying conditions.

	Args:
	img_detect (numpy.ndarray): Image to detect lines in.
	img_out (numpy.ndarray): Image to draw detected lines on.
	offset (tuple): Offset values for drawing.
	draw (bool): Whether to draw the detected line.

	Returns:
	tuple: Tuple containing the center_x and angle of the detected line.
	"""
	# Calculate image metrics to determine parameters
	mean_val = np.mean(img_detect)
	std_val = np.std(img_detect)

	# Adjust parameters based on image statistics
	threshold = max(30, min(100, int(mean_val + std_val)))
	min_line_length = max(15, min(50, int(img_detect.shape[1] * 0.05)))
	max_line_gap = max(5, min(20, int(min_line_length * 0.4)))

	lines = cv2.HoughLinesP(
	img_detect,
	rho=1,
	theta=np.pi / 180,
	threshold=threshold,
	minLineLength=min_line_length,
	maxLineGap=max_line_gap,
	)

	angle = center_x = float("nan")

	if lines is not None and len(lines) > 0:
	points = []
	for line in lines:
	x1, y1, x2, y2 = line[0]
	x1 += offset[0]
	y1 += offset[1]
	x2 += offset[0]
	y2 += offset[1]
	points.append([x1, y1])
	points.append([x2, y2])

	points = np.array(points, dtype=np.float32)
	[vx, vy, x, y] = cv2.fitLine(points, cv2.DIST_L2, 0, 0.01, 0.01)

	center_x = x[0]

	angle = math.degrees(math.atan2(vy[0], vx[0]))
	if angle <= 0:
	angle += 90.0
	else:
	angle -= 90.0

	if draw:
	# Draw the approximated line on the image
	m = 50
	cv2.line(
	img_out,
	(int(x[0] - m * vx[0]), int(y[0] - m * vy[0])),
	(int(x[0] + m * vx[0]), int(y[0] + m * vy[0])),
	(0, 255, 0),
	2,
	)
	cv2.circle(img_out, (int(x[0]), int(y[0])), 2, (255, 0, 0), 3)

	# Display the adaptive parameters used
	cv2.putText(
	img_out,
	f"Threshold: {threshold}",
	(10, 90),
	cv2.FONT_HERSHEY_SIMPLEX,
	0.6,
	(0, 0, 255),
	1,
	)
	cv2.putText(
	img_out,
	f"MinLen: {min_line_length}, MaxGap: {max_line_gap}",
	(10, 110),
	cv2.FONT_HERSHEY_SIMPLEX,
	0.6,
	(0, 0, 255),
	1,
	)

	return center_x, angle


	class RansacLine(ILineEstimationMethod):
	@staticmethod
	def estimate(
	img_detect: np.ndarray, img_out: np.ndarray, offset: tuple, draw: bool = True
	) -> Tuple[float, float]:
	"""
	RANSAC-based line detection method.
	Uses RANSAC to robustly fit a line to detected points, ignoring outliers.

	Args:
	img_detect (numpy.ndarray): Image to detect lines in.
	img_out (numpy.ndarray): Image to draw detected lines on.
	offset (tuple): Offset values for drawing.
	draw (bool): Whether to draw the detected line.

	Returns:
	tuple: Tuple containing the center_x and angle of the detected line.
	"""
	# Find points (could use edge detection or other methods)
	contours, _ = cv2.findContours(
	img_detect, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE
	)

	angle = center_x = float("nan")

	if len(contours) > 0 and cv2.contourArea(contours[0]) > 1500:
	# Extract points from contour
	points = np.vstack(contours[0]).squeeze()

	if len(points) >= 5: # Need minimum points for RANSAC
	# Apply RANSAC to fit line (using findHomography with RANSAC)
	# Could also use cv2.estimateAffine2D or other RANSAC-based functions
	vx, vy, x, y = cv2.fitLine(
	points, cv2.DIST_L2, 0, 0.01, 0.01
	) # RANSAC could be used here

	center_x = x[0] + offset[0]

	angle = math.degrees(math.atan2(vy[0], vx[0]))
	if angle <= 0:
	angle += 90.0
	else:
	angle -= 90.0

	if draw:
	# Draw line on image
	m = 100
	cv2.line(
	img_out,
	(
	int(x[0] + offset[0] - m * vx[0]),
	int(y[0] + offset[1] - m * vy[0]),
	),
	(
	int(x[0] + offset[0] + m * vx[0]),
	int(y[0] + offset[1] + m * vy[0]),
	),
	(0, 255, 0),
	2,
	)
	cv2.circle(
	img_out,
	(int(x[0] + offset[0]), int(y[0] + offset[1])),
	3,
	(0, 0, 255),
	-1,
	)

	return center_x, angle


	class LineDetector:
	def __init__(
	self,
	hsv_values: np.ndarray \| None = None,
	estimation_method: ILineEstimationMethod = HoughLinesP,
	):
	"""
	Constructor for the LineDetector class.

	Args:
	hsv_values (np.ndarray, optional): The HSV lower and upper bounds. Defaults to None (uses default blue).
	estimation_method (ILineEstimationMethod, optional): The method to use for line estimation. Defaults to HoughLinesP.
	"""
	# Initialize ColorDetector first (using its default or handling None/color)
	self.color_detector = ColorDetector()

	# Then, if hsv_values are provided, set them using the property setter
	if hsv_values is not None:
	self.color_detector.hsv_color = hsv_values

	self.estimation_method = estimation_method

	def detect_line(self, img, region=(0, 0), draw=True):
	# apply color filter
	mask, filtered = self.color_detector.filterColor(img)

	# full image if no ROI specified
	if region == (0, 0):
	region = (img.shape[1], img.shape[0])

	# compute ROI center & offset
	h_mask, w_mask = mask.shape
	cx_mask, cy_mask = w_mask // 2, h_mask // 2
	w_roi, h_roi = region
	off_x, off_y = cx_mask - w_roi // 2, cy_mask - h_roi // 2

	# extract ROI from the mask
	roi_mask = cv2.getRectSubPix(mask, region, (cx_mask, cy_mask))

	# estimate line in ROI
	center_x = angle = float("nan")
	confidence = 0.0
	try:
	center_x, angle = self.estimation_method.estimate(
	roi_mask, img, (off_x, off_y), True
	)
	confidence = self._calculate_confidence(roi_mask, center_x, angle)
	except ValueError as e:
	print(f"Error in estimation: {e}")

	# draw diagnostics
	if draw:
	# Get image dimensions for positioning
	h, w = img.shape[:2]

	# Modern color scheme
	roi_color = (41, 128, 185) # Blue
	text_bg_color = (52, 73, 94, 180) # Dark slate with transparency
	text_color = (236, 240, 241) # Almost white

	# Draw ROI rectangle with modern blue color and thinner line
	top_left = (off_x, off_y)
	bottom_right = (off_x + w_roi, off_y + h_roi)
	cv2.rectangle(img, top_left, bottom_right, roi_color, 2)

	# Create semi-transparent overlay for metrics text
	overlay = img.copy()
	padding = 10
	metrics_width = 170
	metrics_height = 70

	# Position in top-left with padding
	cv2.rectangle(
	overlay,
	(padding, padding),
	(padding + metrics_width, padding + metrics_height),
	text_bg_color[:3], # OpenCV doesn't support alpha in rectangle
	-1
	)

	# Apply transparency
	alpha = 0.7
	cv2.addWeighted(overlay, alpha, img, 1 - alpha, 0, img)

	# Modern font
	font = cv2.FONT_HERSHEY_SIMPLEX
	font_scale = 0.6
	font_thickness = 1
	line_height = 25

	# Draw text with clean look
	text_start_x = padding + 10
	text_start_y = padding + 25

	# Function to draw text with subtle shadow for better readability
	def draw_text_with_shadow(text, pos_y):
	# Shadow effect (subtle)
	cv2.putText(
	img, text,
	(text_start_x + 1, pos_y + 1),
	font, font_scale, (0, 0, 0, 150), font_thickness
	)
	# Main text
	cv2.putText(
	img, text,
	(text_start_x, pos_y),
	font, font_scale, text_color, font_thickness
	)

	# Draw each metric
	draw_text_with_shadow(f"Angle: {angle:.2f}", text_start_y)
	draw_text_with_shadow(f"Center X: {center_x:.1f}", text_start_y + line_height)

	# return both the diagnostics and the intermediates
	return img, roi_mask, center_x, angle, confidence

	def _calculate_confidence(self, binary_img, center_x, angle):
	"""
	Calculate a confidence score for the line detection.

	Args:
	binary_img (numpy.ndarray): Binary image used for detection
	center_x (float): Detected center x coordinate
	angle (float): Detected angle

	Returns:
	float: Confidence score between 0.0 and 1.0
	"""
	if math.isnan(center_x) or math.isnan(angle):
	return 0.0

	# Calculate confidence based on:
	# 1. Number of points fitting the line
	# 2. Consistency of the line direction
	# 3. Contrast of the line against background

	# Example implementation
	white_pixels = np.sum(binary_img > 0)
	total_pixels = binary_img.size

	# More complex confidence calculation
	pixel_ratio = min(1.0, white_pixels / (total_pixels * 0.1)) # Normalize

	# Check if center is within reasonable bounds of the image
	h, w = binary_img.shape[:2]
	center_factor = 1.0
	if center_x is not None and not math.isnan(center_x):
	# How far is center_x from the center of the image (normalized 0-1)
	center_distance = abs(center_x - w / 2) / (w / 2)
	center_factor = 1.0 - min(1.0, center_distance)

	# Combine factors
	confidence = pixel_ratio * 0.6 + center_factor * 0.4

	return confidence


	def main():
	color = "teste" # Color to detect
	line_detector = LineDetector(color, HoughLinesP)

	cap = cv2.VideoCapture(0)

	while True:
	ret, frame = cap.read()

	if not ret:
	break

	result, region, center_x, angle, confidence = line_detector.detect_line(
	frame, region=(400, 400)
	)

	print(angle)

	cv2.imshow("Line Detection", result)
	if cv2.waitKey(1) == ord("q"):
	break

	cap.release()
	cv2.destroyAllWindows()


	if __name__ == "__main__":
	main()