import numpy as np
import gradio as gr
import cv2
from copy import deepcopy
import torch
from torchvision import transforms
from PIL import Image

from sam.efficient_sam.build_efficient_sam import build_efficient_sam_vits
from src.utils.utils import resize_numpy_image

# EfficientSAM (ViT-S) is used purely for inference in this module.
sam = build_efficient_sam_vits()
sam.eval()
def show_point_or_box(image, global_points):
    """Draw the current selection on `image`: a dot after the first click,
    a rectangle once both corner points are available."""
    if len(global_points) == 1:
        image = cv2.circle(image, tuple(map(int, global_points[0])), 10, (0, 0, 255), -1)
    elif len(global_points) == 2:
        p1, p2 = global_points
        image = cv2.rectangle(
            image,
            (int(p1[0]), int(p1[1])),
            (int(p2[0]), int(p2[1])),
            (0, 0, 255),
            2,
        )
    return image

def segment_with_points(
    image,
    original_image,
    global_points,
    global_point_label,
    evt: gr.SelectData,
    img_direction,
    save_dir="./tmp",  # currently unused
):
    """Collect two clicks as a box prompt and segment with EfficientSAM.

    Labels 2 and 3 are EfficientSAM's point-prompt codes for the top-left and
    bottom-right corners of a box.
    """
    if original_image is None:
        original_image = image
    else:
        image = original_image
    if img_direction is None:
        img_direction = original_image
    x, y = evt.index[0], evt.index[1]

    if len(global_points) == 0:
        # First click: store the point and show it.
        global_points.append([x, y])
        global_point_label.append(2)
        image_with_point = show_point_or_box(image.copy(), global_points)
        return image_with_point, original_image, None, global_points, global_point_label
    elif len(global_points) == 1:
        # Second click: normalize the corners to (top-left, bottom-right).
        global_points.append([x, y])
        global_point_label.append(3)
        x1, y1 = global_points[0]
        x2, y2 = global_points[1]
        global_points[0] = [min(x1, x2), min(y1, y2)]
        global_points[1] = [max(x1, x2), max(y1, y2)]
        image_with_point = show_point_or_box(image.copy(), global_points)

        # Run EfficientSAM on the box prompt; no gradients are needed here.
        input_point = np.array(global_points)
        input_label = np.array(global_point_label)
        pts_sampled = torch.reshape(torch.tensor(input_point), [1, 1, -1, 2])
        pts_labels = torch.reshape(torch.tensor(input_label), [1, 1, -1])
        img_tensor = transforms.ToTensor()(image)

        with torch.no_grad():
            predicted_logits, predicted_iou = sam(
                img_tensor[None, ...],
                pts_sampled,
                pts_labels,
            )
        # Threshold the first predicted mask at logit 0.
        mask = torch.ge(predicted_logits[0, 0, 0, :, :], 0).float().cpu().numpy()
        mask_uint8 = (mask * 255.).astype(np.uint8)
        return image_with_point, original_image, mask_uint8, global_points, global_point_label
    else:
        # Third click: start a new selection.
        global_points = [[x, y]]
        global_point_label = [2]
        image_with_point = show_point_or_box(image.copy(), global_points)
        return image_with_point, original_image, None, global_points, global_point_label

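# Sketch of how `segment_with_points` is typically wired into the Gradio UI.
# The component and state names below are illustrative, not taken from this
# repo's app script; Gradio fills in the `evt: gr.SelectData` argument itself,
# so it does not appear in `inputs`:
#
#   input_img = gr.Image(label="Input")
#   input_img.select(
#       segment_with_points,
#       inputs=[input_img, original_image, global_points, global_point_label, img_direction],
#       outputs=[input_img, original_image, mask_output, global_points, global_point_label],
#   )
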
def segment_with_points_paste(
    image,
    original_image,
    global_points,
    global_point_label,
    image_b,
    evt: gr.SelectData,
    dx,
    dy,
    resize_scale,
):
    """Same two-click box segmentation as `segment_with_points`, but also
    paste the segmented region onto `image_b` with the given offset and scale."""
    if original_image is None:
        original_image = image
    else:
        image = original_image
    x, y = evt.index[0], evt.index[1]

    if len(global_points) == 0:
        # First click: store the point and show it.
        global_points.append([x, y])
        global_point_label.append(2)
        image_with_point = show_point_or_box(image.copy(), global_points)
        return image_with_point, original_image, None, global_points, global_point_label, None
    elif len(global_points) == 1:
        # Second click: normalize the corners to (top-left, bottom-right).
        global_points.append([x, y])
        global_point_label.append(3)
        x1, y1 = global_points[0]
        x2, y2 = global_points[1]
        global_points[0] = [min(x1, x2), min(y1, y2)]
        global_points[1] = [max(x1, x2), max(y1, y2)]
        image_with_point = show_point_or_box(image.copy(), global_points)

        # Run EfficientSAM on the box prompt; no gradients are needed here.
        input_point = np.array(global_points)
        input_label = np.array(global_point_label)
        pts_sampled = torch.reshape(torch.tensor(input_point), [1, 1, -1, 2])
        pts_labels = torch.reshape(torch.tensor(input_label), [1, 1, -1])
        img_tensor = transforms.ToTensor()(image)

        with torch.no_grad():
            predicted_logits, predicted_iou = sam(
                img_tensor[None, ...],
                pts_sampled,
                pts_labels,
            )
        mask = torch.ge(predicted_logits[0, 0, 0, :, :], 0).float().cpu().numpy()
        mask_uint8 = (mask * 255.).astype(np.uint8)

        pasted = paste_with_mask_and_offset(image, image_b, mask_uint8, dx, dy, resize_scale)
        return image_with_point, original_image, pasted, global_points, global_point_label, mask_uint8
    else:
        # Third click: start a new selection.
        global_points = [[x, y]]
        global_point_label = [2]
        image_with_point = show_point_or_box(image.copy(), global_points)
        return image_with_point, original_image, None, global_points, global_point_label, None

def paste_with_mask_and_offset(image_a, image_b, mask, x_offset=0, y_offset=0, delta=1):
    """Cut the masked region out of `image_a`, rescale it by `delta`, and paste
    it onto a half-transparent copy of `image_b` at the given pixel offset.
    Returns an RGBA PIL image, or None if the mask is empty or pasting fails."""
    try:
        # Bounding box and center of the masked region.
        numpy_mask = np.array(mask)
        y_coords, x_coords = np.nonzero(numpy_mask)
        x_min, x_max = x_coords.min(), x_coords.max()
        y_min, y_max = y_coords.min(), y_coords.max()
        target_center_x = int((x_min + x_max) / 2)
        target_center_y = int((y_min + y_max) / 2)

        image_a = Image.fromarray(image_a)
        image_b = Image.fromarray(image_b)
        mask = Image.fromarray(mask)

        if image_a.size != mask.size:
            mask = mask.resize(image_a.size)

        # Keep only the masked pixels of image_a; everything else is transparent.
        cropped_image = Image.composite(image_a, Image.new('RGBA', image_a.size, (0, 0, 0, 0)), mask)

        # Shift the offset so that scaling by `delta` pivots around the mask center.
        x_b = int(target_center_x * (image_b.width / cropped_image.width))
        y_b = int(target_center_y * (image_b.height / cropped_image.height))
        x_offset = x_offset - int((delta - 1) * x_b)
        y_offset = y_offset - int((delta - 1) * y_b)

        cropped_image = cropped_image.resize(image_b.size)
        new_size = (int(cropped_image.width * delta), int(cropped_image.height * delta))
        cropped_image = cropped_image.resize(new_size)

        # Compose: half-transparent background, then the cut-out on top.
        image_b.putalpha(128)
        result_image = Image.new('RGBA', image_b.size, (0, 0, 0, 0))
        result_image.paste(image_b, (0, 0))
        result_image.paste(cropped_image, (x_offset, y_offset), mask=cropped_image)

        return result_image
    except Exception:
        return None

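# Minimal standalone sketch of `paste_with_mask_and_offset` on synthetic
# arrays (names and values here are illustrative only):
#
#   a = np.zeros((64, 64, 3), dtype=np.uint8)
#   a[16:48, 16:48] = 255                      # white square to cut out
#   b = np.full((64, 64, 3), 127, dtype=np.uint8)
#   m = np.zeros((64, 64), dtype=np.uint8)
#   m[16:48, 16:48] = 255                      # mask selecting the square
#   out = paste_with_mask_and_offset(a, b, m, x_offset=5, y_offset=5, delta=1)
#   # `out` is an RGBA PIL image: the masked square pasted 5 px down/right
#   # onto a half-transparent copy of `b`.
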
def upload_image_move(img, original_image):
    # Keep the stored original if one exists; otherwise adopt the upload.
    if original_image is not None:
        return original_image
    else:
        return img


def fun_clear(*args):
    """Reset a batch of Gradio states: lists become empty lists, everything
    else becomes None, e.g. fun_clear([1, 2], None, 5) -> ([], None, None)."""
    result = []
    for arg in args:
        if isinstance(arg, list):
            result.append([])
        else:
            result.append(None)
    return tuple(result)

def clear_points(img):
    # `img` is a dict with "image" and "mask" entries (Gradio sketch-tool input).
    image, mask = img["image"], np.float32(img["mask"][:, :, 0]) / 255.
    if mask.sum() > 0:
        mask = np.uint8(mask > 0)
        masked_img = mask_image(image, 1 - mask, color=[0, 0, 0], alpha=0.3)
    else:
        masked_img = image.copy()
    # Reset the point list but keep the masked preview.
    return [], masked_img

def get_point(img, sel_pix, evt: gr.SelectData):
    """Record a clicked point and redraw all accumulated drag pairs: one dot
    per click (alternating colors) and an arrow from each source to its target."""
    sel_pix.append(evt.index)
    points = []
    for idx, point in enumerate(sel_pix):
        if idx % 2 == 0:
            cv2.circle(img, tuple(point), 10, (0, 0, 255), -1)
        else:
            cv2.circle(img, tuple(point), 10, (255, 0, 0), -1)
        points.append(tuple(point))
        if len(points) == 2:
            cv2.arrowedLine(img, points[0], points[1], (255, 255, 255), 4, tipLength=0.5)
            points = []
    return img if isinstance(img, np.ndarray) else np.array(img)

def calculate_translation_percentage(ori_shape, selected_points):
    """Return the drag offset between two points as fractions of the image
    width (dx) and height (dy); `ori_shape` is a (H, W, ...) numpy shape."""
    dx = selected_points[1][0] - selected_points[0][0]
    dy = selected_points[1][1] - selected_points[0][1]
    dx_percentage = dx / ori_shape[1]
    dy_percentage = dy / ori_shape[0]
    return dx_percentage, dy_percentage

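# Worked example: for a 100x200 image (H=100, W=200) and clicks at (10, 40)
# then (110, 20), the offsets are dx = (110 - 10) / 200 = 0.5 and
# dy = (20 - 40) / 100 = -0.2, i.e. half the width rightward and a fifth of
# the height upward.
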
def get_point_move(original_image, img, sel_pix, evt: gr.SelectData):
    """Like `get_point`, but redraws on a fresh copy of the original image and
    also returns the drag offset as a fraction of the image size."""
    if original_image is not None:
        img = original_image.copy()
    else:
        original_image = img.copy()
    # Keep at most one source/target pair; a third click starts a new pair.
    if len(sel_pix) < 2:
        sel_pix.append(evt.index)
    else:
        sel_pix = [evt.index]
    points = []
    dx, dy = 0, 0
    for idx, point in enumerate(sel_pix):
        if idx % 2 == 0:
            cv2.circle(img, tuple(point), 10, (0, 0, 255), -1)
        else:
            cv2.circle(img, tuple(point), 10, (255, 0, 0), -1)
        points.append(tuple(point))
        if len(points) == 2:
            cv2.arrowedLine(img, points[0], points[1], (255, 255, 255), 4, tipLength=0.5)
            dx, dy = calculate_translation_percentage(original_image.shape, sel_pix)
            points = []
    img = np.array(img)
    return img, original_image, sel_pix, dx, dy

def store_img(img):
    """Split a sketch-tool input into the raw image, a preview with the
    unmasked area dimmed, and the binary mask."""
    image, mask = img["image"], np.float32(img["mask"][:, :, 0]) / 255.
    if mask.sum() > 0:
        mask = np.uint8(mask > 0)
        masked_img = mask_image(image, 1 - mask, color=[0, 0, 0], alpha=0.3)
    else:
        masked_img = image.copy()
    return image, masked_img, mask


def store_img_move(img, mask=None):
    """Variant of `store_img` that reuses a precomputed mask when given and
    returns the mask scaled to uint8 in [0, 255]."""
    if mask is not None:
        image = img["image"]
        return image, None, mask
    image, mask = img["image"], np.float32(img["mask"][:, :, 0]) / 255.
    if mask.sum() > 0:
        mask = np.uint8(mask > 0)
        masked_img = mask_image(image, 1 - mask, color=[0, 0, 0], alpha=0.3)
    else:
        masked_img = image.copy()
    return image, masked_img, (mask * 255.).astype(np.uint8)

def mask_image(image, mask, color=[255, 0, 0], alpha=0.5, max_resolution=None):
    """Overlay a mask on an image for visualization.

    Args:
        image (H, W, 3) or (H, W): input image
        mask (H, W): binary mask to overlay
        color: color applied to masked pixels before blending
        alpha: opacity of the overlay
        max_resolution: if set, resize the image so its area is at most
            max_resolution**2 before overlaying
    """
    if max_resolution is not None:
        image, _ = resize_numpy_image(image, max_resolution * max_resolution)
        mask = cv2.resize(mask, (image.shape[1], image.shape[0]), interpolation=cv2.INTER_NEAREST)

    out = deepcopy(image)
    img = deepcopy(image)
    img[mask == 1] = color
    out = cv2.addWeighted(img, alpha, out, 1 - alpha, 0, out)
    return out
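

# Example (synthetic data, illustrative only):
#
#   img = np.zeros((100, 100, 3), dtype=np.uint8)
#   m = np.zeros((100, 100), dtype=np.uint8)
#   m[25:75, 25:75] = 1
#   vis = mask_image(img, m, color=[255, 0, 0], alpha=0.5)
#   # masked pixels are blended halfway toward red; the rest is unchanged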