adpro committed
Commit a4a91be
1 Parent(s): ce4e094

Update app.py

Files changed (1)
  1. app.py +243 -29
app.py CHANGED
@@ -1,37 +1,251 @@
-from torch import torch.hub
-import gluoncv
-import mxnet as mx
-from gluoncv.utils.viz import get_color_pallete
-import gradio as gr
+from __future__ import absolute_import, division, print_function
+
+import click
+import cv2
+import matplotlib
+import matplotlib.cm as cm
+import matplotlib.pyplot as plt
 import numpy as np
-from PIL import Image
-from gluoncv.data.transforms.presets.segmentation import test_transform

-# using cpu
-ctx = mx.cpu(0)

-model = torch.hub.load("kazuto1011/deeplab-pytorch", "deeplabv2_resnet101", pretrained='cocostuff164k', n_classes=182)


-def segmentation(image):
-    img = Image.fromarray(image)
-    img = mx.ndarray.array(img)
-    img = test_transform(img, ctx)
-    output = model.predict(img)
-    predict = mx.nd.squeeze(mx.nd.argmax(output, 1)).asnumpy()
-    mask = get_color_pallete(predict, "ade20k")
-    return mask


-image_in = gr.Image()
-image_out = gr.components.Image()
-description = "MXNet Image Segmentation Model"
-examples=['cat.jpeg']

-Iface = gr.Interface(
-    fn=segmentation,
-    inputs=image_in,
-    outputs=image_out,
-    title="Semantic Segmentation - MXNet",
-    examples=examples
-).launch()
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+from omegaconf import OmegaConf
+
+from libs.models import *
+from libs.utils import DenseCRF
+
+
+def get_device(cuda):
+    cuda = cuda and torch.cuda.is_available()
+    device = torch.device("cuda" if cuda else "cpu")
+    if cuda:
+        current_device = torch.cuda.current_device()
+        print("Device:", torch.cuda.get_device_name(current_device))
+    else:
+        print("Device: CPU")
+    return device
+
+
+def get_classtable(CONFIG):
+    with open(CONFIG.DATASET.LABELS) as f:
+        classes = {}
+        for label in f:
+            label = label.rstrip().split("\t")
+            classes[int(label[0])] = label[1].split(",")[0]
+    return classes
+
+
+def setup_postprocessor(CONFIG):
+    # CRF post-processor
+    postprocessor = DenseCRF(
+        iter_max=CONFIG.CRF.ITER_MAX,
+        pos_xy_std=CONFIG.CRF.POS_XY_STD,
+        pos_w=CONFIG.CRF.POS_W,
+        bi_xy_std=CONFIG.CRF.BI_XY_STD,
+        bi_rgb_std=CONFIG.CRF.BI_RGB_STD,
+        bi_w=CONFIG.CRF.BI_W,
+    )
+    return postprocessor
+
+
+def preprocessing(image, device, CONFIG):
+    # Resize
+    scale = CONFIG.IMAGE.SIZE.TEST / max(image.shape[:2])
+    image = cv2.resize(image, dsize=None, fx=scale, fy=scale)
+    raw_image = image.astype(np.uint8)
+
+    # Subtract mean values
+    image = image.astype(np.float32)
+    image -= np.array(
+        [
+            float(CONFIG.IMAGE.MEAN.B),
+            float(CONFIG.IMAGE.MEAN.G),
+            float(CONFIG.IMAGE.MEAN.R),
+        ]
+    )
+
+    # Convert to torch.Tensor and add "batch" axis
+    image = torch.from_numpy(image.transpose(2, 0, 1)).float().unsqueeze(0)
+    image = image.to(device)
+
+    return image, raw_image
+
+
+def inference(model, image, raw_image=None, postprocessor=None):
+    _, _, H, W = image.shape
+
+    # Image -> Probability map
+    logits = model(image)
+    logits = F.interpolate(logits, size=(H, W), mode="bilinear", align_corners=False)
+    probs = F.softmax(logits, dim=1)[0]
+    probs = probs.cpu().numpy()
+
+    # Refine the prob map with CRF
+    if postprocessor and raw_image is not None:
+        probs = postprocessor(raw_image, probs)
+
+    labelmap = np.argmax(probs, axis=0)
+
+    return labelmap
+
+
+@click.group()
+@click.pass_context
+def main(ctx):
+    """
+    Demo with a trained model
+    """
+
+    print("Mode:", ctx.invoked_subcommand)
+
+
+@main.command()
+@click.option(
+    "-c",
+    "--config-path",
+    type=click.File(),
+    required=True,
+    help="Dataset configuration file in YAML",
+)
+@click.option(
+    "-m",
+    "--model-path",
+    type=click.Path(exists=True),
+    required=True,
+    help="PyTorch model to be loaded",
+)
+@click.option(
+    "-i",
+    "--image-path",
+    type=click.Path(exists=True),
+    required=True,
+    help="Image to be processed",
+)
+@click.option(
+    "--cuda/--cpu", default=True, help="Enable CUDA if available [default: --cuda]"
+)
+@click.option("--crf", is_flag=True, show_default=True, help="CRF post-processing")
+def single(config_path, model_path, image_path, cuda, crf):
+    """
+    Inference from a single image
+    """
+
+    # Setup
+    CONFIG = OmegaConf.load(config_path)
+    device = get_device(cuda)
+    torch.set_grad_enabled(False)
+
+    classes = get_classtable(CONFIG)
+    postprocessor = setup_postprocessor(CONFIG) if crf else None
+
+    model = eval(CONFIG.MODEL.NAME)(n_classes=CONFIG.DATASET.N_CLASSES)
+    state_dict = torch.load(model_path, map_location=lambda storage, loc: storage)
+    model.load_state_dict(state_dict)
+    model.eval()
+    model.to(device)
+    print("Model:", CONFIG.MODEL.NAME)
+
+    # Inference
+    image = cv2.imread(image_path, cv2.IMREAD_COLOR)
+    image, raw_image = preprocessing(image, device, CONFIG)
+    labelmap = inference(model, image, raw_image, postprocessor)
+    labels = np.unique(labelmap)
+
+    # Show result for each class
+    rows = np.floor(np.sqrt(len(labels) + 1))
+    cols = np.ceil((len(labels) + 1) / rows)
+
+    plt.figure(figsize=(10, 10))
+    ax = plt.subplot(rows, cols, 1)
+    ax.set_title("Input image")
+    ax.imshow(raw_image[:, :, ::-1])
+    ax.axis("off")
+
+    for i, label in enumerate(labels):
+        mask = labelmap == label
+        ax = plt.subplot(rows, cols, i + 2)
+        ax.set_title(classes[label])
+        ax.imshow(raw_image[..., ::-1])
+        ax.imshow(mask.astype(np.float32), alpha=0.5)
+        ax.axis("off")
+
+    plt.tight_layout()
+    plt.show()
+
+
+@main.command()
+@click.option(
+    "-c",
+    "--config-path",
+    type=click.File(),
+    required=True,
+    help="Dataset configuration file in YAML",
+)
+@click.option(
+    "-m",
+    "--model-path",
+    type=click.Path(exists=True),
+    required=True,
+    help="PyTorch model to be loaded",
+)
+@click.option(
+    "--cuda/--cpu", default=True, help="Enable CUDA if available [default: --cuda]"
+)
+@click.option("--crf", is_flag=True, show_default=True, help="CRF post-processing")
+@click.option("--camera-id", type=int, default=0, show_default=True, help="Device ID")
+def live(config_path, model_path, cuda, crf, camera_id):
+    """
+    Inference from camera stream
+    """
+
+    # Setup
+    CONFIG = OmegaConf.load(config_path)
+    device = get_device(cuda)
+    torch.set_grad_enabled(False)
+    torch.backends.cudnn.benchmark = True
+
+    classes = get_classtable(CONFIG)
+    postprocessor = setup_postprocessor(CONFIG) if crf else None
+
+    model = eval(CONFIG.MODEL.NAME)(n_classes=CONFIG.DATASET.N_CLASSES)
+    state_dict = torch.load(model_path, map_location=lambda storage, loc: storage)
+    model.load_state_dict(state_dict)
+    model.eval()
+    model.to(device)
+    print("Model:", CONFIG.MODEL.NAME)
+
+    # UVC camera stream
+    cap = cv2.VideoCapture(camera_id)
+    cap.set(cv2.CAP_PROP_FOURCC, cv2.VideoWriter_fourcc(*"YUYV"))

+    def colorize(labelmap):
+        # Assign a unique color to each label
+        labelmap = labelmap.astype(np.float32) / CONFIG.DATASET.N_CLASSES
+        colormap = cm.jet_r(labelmap)[..., :-1] * 255.0
+        return np.uint8(colormap)

+    def mouse_event(event, x, y, flags, labelmap):
+        # Show a class name of a mouse-overed pixel
+        label = labelmap[y, x]
+        name = classes[label]
+        print(name)

+    window_name = "{} + {}".format(CONFIG.MODEL.NAME, CONFIG.DATASET.NAME)
+    cv2.namedWindow(window_name, cv2.WINDOW_AUTOSIZE)

+    while True:
+        _, frame = cap.read()
+        image, raw_image = preprocessing(frame, device, CONFIG)
+        labelmap = inference(model, image, raw_image, postprocessor)
+        colormap = colorize(labelmap)

+        # Register mouse callback function
+        cv2.setMouseCallback(window_name, mouse_event, labelmap)

+        # Overlay prediction
+        cv2.addWeighted(colormap, 0.5, raw_image, 0.5, 0.0, raw_image)

+        # Quit by pressing "q" key
+        cv2.imshow(window_name, raw_image)
+        if cv2.waitKey(10) == ord("q"):
+            break
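
For context: the rewritten app.py is a click CLI with two subcommands, single (one image, matplotlib figure per class) and live (camera stream with CRF-refined overlay), rather than a Gradio app. Assuming the file ends with the usual `if __name__ == "__main__": main()` guard (not visible in this hunk) and that a matching OmegaConf YAML and checkpoint exist, a hypothetical invocation looks like this (all paths below are placeholders, not files shipped with this commit):

    python app.py single --config-path configs/cocostuff164k.yaml --model-path checkpoint_final.pth --image-path cat.jpeg --crf
    python app.py live --config-path configs/cocostuff164k.yaml --model-path checkpoint_final.pth --cpu --camera-id 0

--crf switches on DenseCRF refinement of the softmax output, and --cuda/--cpu (default --cuda) selects the device via get_device().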
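The DenseCRF post-processor imported from libs.utils is configured in setup_postprocessor() but implemented outside this diff. As a rough sketch only, based on the parameter names (iter_max, pos_*, bi_*) rather than the repository's actual code, such a wrapper typically delegates to pydensecrf along these lines:

    import numpy as np
    import pydensecrf.densecrf as dcrf
    import pydensecrf.utils as crf_utils


    class DenseCRF:
        # Hypothetical wrapper; the real libs/utils.py is not shown in this diff.
        def __init__(self, iter_max, pos_w, pos_xy_std, bi_w, bi_xy_std, bi_rgb_std):
            self.iter_max = iter_max      # number of mean-field iterations
            self.pos_w = pos_w            # weight of the position-only (Gaussian) kernel
            self.pos_xy_std = pos_xy_std  # spatial std of the Gaussian kernel
            self.bi_w = bi_w              # weight of the bilateral (position + color) kernel
            self.bi_xy_std = bi_xy_std    # spatial std of the bilateral kernel
            self.bi_rgb_std = bi_rgb_std  # color std of the bilateral kernel

        def __call__(self, image, probmap):
            # image: HxWx3 uint8; probmap: CxHxW softmax probabilities,
            # matching how inference() calls postprocessor(raw_image, probs).
            C, H, W = probmap.shape
            unary = crf_utils.unary_from_softmax(probmap)  # -log(prob), shape (C, H*W)
            unary = np.ascontiguousarray(unary)
            image = np.ascontiguousarray(image)

            d = dcrf.DenseCRF2D(W, H, C)
            d.setUnaryEnergy(unary)
            d.addPairwiseGaussian(sxy=self.pos_xy_std, compat=self.pos_w)
            d.addPairwiseBilateral(
                sxy=self.bi_xy_std, srgb=self.bi_rgb_std, rgbim=image, compat=self.bi_w
            )

            Q = d.inference(self.iter_max)
            return np.array(Q).reshape((C, H, W))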