Spaces:
Sleeping
Sleeping
# Standard library imports | |
# (Add any necessary imports for future object detection implementation) | |
import json | |
# Third-party imports | |
from PIL import Image | |
import numpy as np | |
from ultralytics import YOLO | |
# Local imports | |
from utils.image_utils import load_image, preprocess_image | |
# Load the YOLOv8 model globally to avoid reloading on each function call | |
# Using a common pre-trained YOLOv8 nano model ('yolov8n.pt') | |
try: | |
model = YOLO('yolov8n.pt') | |
print("YOLOv8 model loaded successfully.") | |
except Exception as e: | |
print(f"Error loading YOLOv8 model: {e}") | |
model = None # Set model to None if loading fails | |
def object_detection(input_type, uploaded_image, image_url, base64_string): | |
""" | |
Performs object detection on the image from various input types using YOLOv8. | |
Args: | |
input_type (str): The selected input method ("Upload File", "Enter URL", "Enter Base64"). | |
uploaded_image (PIL.Image.Image): The uploaded image (if input_type is "Upload File"). | |
image_url (str): The image URL (if input_type is "Enter URL"). | |
base64_string (str): The image base64 string (if input_type is "Enter Base64"). | |
Returns: | |
tuple: A tuple containing: | |
- numpy.ndarray: The image with detected objects drawn on it, or None if an error occurred or model not loaded. | |
- dict: A dictionary containing the raw detection data (bounding boxes, classes, scores), or None. | |
""" | |
if model is None: | |
print("YOLOv8 model is not loaded. Cannot perform object detection.") | |
return None, None # Return None for both outputs | |
image = None | |
input_value = None | |
if input_type == "Upload File" and uploaded_image is not None: | |
image = uploaded_image # This is a PIL Image | |
print("Using uploaded image (PIL) for object detection") # Debug print | |
elif input_type == "Enter URL" and image_url and image_url.strip(): | |
input_value = image_url | |
print(f"Using URL for object detection: {input_value}") # Debug print | |
elif input_type == "Enter Base64" and base64_string and base64_string.strip(): | |
input_value = base64_string | |
print(f"Using Base64 string for object detection") # Debug print | |
else: | |
print("No valid input provided for object detection based on selected type.") | |
return None, None # Return None for both outputs | |
# If input_value is set (URL or Base64), use load_image | |
if input_value: | |
image = load_image(input_value) | |
if image is None: | |
return None, None # load_image failed | |
# Now 'image' should be a PIL Image or None | |
if image is None: | |
print("Image is None after loading/selection for object detection.") | |
return None, None # Return None for both outputs | |
try: | |
# Preprocess the image (convert PIL to numpy, ensure RGB) | |
processed_image_np = preprocess_image(image) | |
# Perform inference | |
results = model.predict(processed_image_np) | |
# Extract raw detection data | |
raw_data = [] | |
if results and results[0].boxes: | |
for box in results[0].boxes: | |
# box.xywh contains [x_center, y_center, width, height] | |
# box.conf contains confidence score | |
# box.cls contains class index | |
x_center, y_center, width, height = [round(float(coord), 2) for coord in box.xywh[0].tolist()] # Changed to xywh | |
confidence = round(float(box.conf[0]), 4) | |
class_id = int(box.cls[0]) | |
class_name = model.names[class_id] if model.names else str(class_id) # Get class name if available | |
raw_data.append({ | |
"box": {"x": x_center, "y": y_center, "w": width, "h": height}, # Updated keys | |
"confidence": confidence, | |
"class_id": class_id, | |
"class_name": class_name | |
}) | |
# Draw results on the image | |
result_image_np = results[0].plot() if results else processed_image_np # Plot if results exist | |
print("Object detection performed successfully.") | |
return result_image_np, raw_data # Return both the image and raw data | |
except Exception as e: | |
print(f"Error during YOLOv8 object detection: {e}") | |
return None, None # Return None for both outputs | |