import gradio as gr
import torch
import cv2
import numpy as np
from PIL import Image
from ultralytics import YOLO
import json
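
# Path to the detection weights. "best.pt" is assumed to be a custom-trained
# YOLO model whose class names include "front" and "back" (the two sides of a
# license card), since those names are used to route the crops below.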
model_path = "best.pt"
model = YOLO(model_path)


def preprocess_image(image):
    """Apply enhancement filters and resize the image before detection."""
    image = np.array(image)
    image = cv2.convertScaleAbs(image, alpha=0.8, beta=0)  # Brightness reduction
    image = cv2.GaussianBlur(image, (3, 3), 0)  # Denoising
    kernel = np.array([[0, -1, 0], [-1, 5, -1], [0, -1, 0]])  # Sharpening kernel
    image = cv2.filter2D(image, -1, kernel)

    # Resize to a fixed width of 800 px, preserving the aspect ratio
    height, width = image.shape[:2]
    new_width = 800
    new_height = int((new_width / width) * height)
    image = cv2.resize(image, (new_width, new_height))
    return image


def imageRotation(image):
    """Dummy function for now."""
    return image
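
# Note: imageRotation is currently a pass-through placeholder. If orientation
# correction is added later, one minimal approach (an illustrative sketch, not
# the author's method) would be OpenCV's rotate, e.g.:
#     rotated = cv2.rotate(np.array(image), cv2.ROTATE_90_CLOCKWISE)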


def vision_ai_api(image, label):
    """Dummy function simulating an API call. Returns a dummy JSON response."""
    return {
        "label": label,
        "extracted_data": {
            "name": "-------",
            "dob": "-------",
            "id_number": "-------"
        }
    }
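
# In a real deployment, vision_ai_api would presumably encode the cropped PIL
# image (e.g. to bytes or base64) and POST it to an external Vision/OCR
# endpoint, then map the provider's response onto the {"label",
# "extracted_data"} shape used above. That integration is not defined in this
# repo, so the dummy response stands in for it.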


def predict(image):
    """Run detection, crop the detected card sides, and call the API for each crop."""
    image = preprocess_image(image)
    results = model(image, conf=0.80)

    detected_classes = set()
    labels = []
    cropped_images = {}

    for result in results:
        for box in result.boxes:
            x1, y1, x2, y2 = map(int, box.xyxy[0])
            conf = float(box.conf[0])
            cls = int(box.cls[0])
            class_name = model.names[cls]

            print(f"Detected: {class_name} ({conf:.2f}) at [{x1}, {y1}, {x2}, {y2}]")
            detected_classes.add(class_name)
            labels.append(f"{class_name} {conf:.2f}")

            # Clamp bounding boxes to the image borders
            height, width = image.shape[:2]
            x1, y1, x2, y2 = max(0, x1), max(0, y1), min(width, x2), min(height, y2)
            if x1 >= x2 or y1 >= y2:
                print("Invalid bounding box, skipping.")
                continue

            cropped = image[y1:y2, x1:x2]
            cropped_pil = Image.fromarray(cropped)

            # Call the (dummy) Vision AI API for this crop
            api_response = vision_ai_api(cropped_pil, class_name)
            cropped_images[class_name] = {
                "image": cropped_pil,
                "api_response": json.dumps(api_response, indent=4),
            }

    if not cropped_images:
        return None, "No front detected", None, "No back detected", "No valid detections"

    return (
        cropped_images.get("front", {}).get("image", None),
        cropped_images.get("front", {}).get("api_response", "{}"),
        cropped_images.get("back", {}).get("image", None),
        cropped_images.get("back", {}).get("api_response", "{}"),
        "\n".join(labels),
    )
# Gradio Interface
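# predict() returns five values (front crop, front API response, back crop,
# back API response, detection labels), so the interface declares five
# matching output components.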
iface = gr.Interface(
    fn=predict,
    inputs=gr.Image(type="numpy", label="Card Image"),
    outputs=[
        gr.Image(label="Front Crop"),
        gr.Textbox(label="Front API Response"),
        gr.Image(label="Back Crop"),
        gr.Textbox(label="Back API Response"),
        gr.Textbox(label="Detections"),
    ],
    title="License Field Detection (Front & Back Card)",
    description="Detect the front & back of a license card, crop each side, and call the Vision AI API separately for each crop.",
)

iface.launch()
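
# launch() starts the Gradio server. When this file is run directly
# (e.g. `python app.py`, or automatically on a Hugging Face Space), Gradio
# prints a local URL where the UI can be opened.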