Spaces:

lofrienger
/

polypseg

Sleeping

App Files Files Community

lofrienger commited on Dec 18, 2023

Commit

a37c14e

1 Parent(s): 9da2171

init

Browse files

Files changed (3) hide show

app.py +53 -0
unet.py +372 -0
unet_model.pth +3 -0

app.py ADDED Viewed

	@@ -0,0 +1,53 @@

+# Import necessary libraries and load the model
+import gradio as gr
+import torch
+import numpy as np
+from PIL import Image
+from torchvision import transforms
+from unet import UNet  # Assuming UNet is the model class
+MEAN = np.array([0.4732661 , 0.44874457, 0.3948762 ], dtype=np.float32)
+STD = np.array([0.22674961, 0.22012031, 0.2238305 ], dtype=np.float32)
+device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+model = UNet(in_chns=3, class_num=2)  # Initialize your model
+model.load_state_dict(torch.load('unet_model.pth'))
+model = model.to(device)
+model.eval()
+# Define the segmentation function
+def segment(img):
+    img = Image.fromarray(img.astype('uint8'), 'RGB')
+    original_size = img.size  # Store the original size
+    img = img.resize((224, 224), Image.BILINEAR)
+    img = transforms.ToTensor()(img)
+    for i in range(3):
+        img[:, :, i] -= float(MEAN[i])
+    for i in range(3):
+        img[:, :, i] /= float(STD[i])
+    img = img.unsqueeze(0).to(device)
+    with torch.no_grad():
+        output = model(img)
+    output = torch.argmax(torch.softmax(output, dim=1), dim=1).squeeze().cpu().numpy()
+    # Resize the mask back to the original image size
+    output = Image.fromarray(output.astype('uint8')).resize(original_size, resample=Image.BILINEAR)
+    # Convert the PIL Image back to a numpy array
+    output = np.array(output)
+    binary_mask = np.zeros_like(output)
+    binary_mask[output > 0] = 255
+    return binary_mask
+# Create a Gradio interface
+iface = gr.Interface(fn=segment, inputs="image", outputs="image", title="Segmentation Model",
+    description="Segment objects in an image.",
+    allow_flagging=False)
+# Launch the interface
+iface.launch()

unet.py ADDED Viewed

	@@ -0,0 +1,372 @@

+# -*- coding: utf-8 -*-
+"""
+The implementation is borrowed from: https://github.com/HiLab-git/PyMIC
+"""
+from __future__ import division, print_function
+import numpy as np
+import torch
+import torch.nn as nn
+from torch.distributions.uniform import Uniform
+class ConvBlock(nn.Module):
+    """two convolution layers with batch norm and leaky relu"""
+    def __init__(self, in_channels, out_channels, dropout_p):
+        super(ConvBlock, self).__init__()
+        self.conv_conv = nn.Sequential(
+            nn.Conv2d(in_channels, out_channels, kernel_size=3, padding=1),
+            nn.BatchNorm2d(out_channels),
+            nn.LeakyReLU(),
+            nn.Dropout(dropout_p),
+            nn.Conv2d(out_channels, out_channels, kernel_size=3, padding=1),
+            nn.BatchNorm2d(out_channels),
+            nn.LeakyReLU()
+        )
+    def forward(self, x):
+        return self.conv_conv(x)
+class DownBlock(nn.Module):
+    """Downsampling followed by ConvBlock"""
+    def __init__(self, in_channels, out_channels, dropout_p):
+        super(DownBlock, self).__init__()
+        self.maxpool_conv = nn.Sequential(
+            nn.MaxPool2d(2),
+            ConvBlock(in_channels, out_channels, dropout_p)
+        )
+    def forward(self, x):
+        return self.maxpool_conv(x)
+class UpBlock(nn.Module):
+    """Upssampling followed by ConvBlock"""
+    def __init__(self, in_channels1, in_channels2, out_channels, dropout_p,
+                 bilinear=True):
+        super(UpBlock, self).__init__()
+        self.bilinear = bilinear
+        if self.bilinear != 'convtrans':
+            self.conv1x1 = nn.Conv2d(in_channels1, in_channels2, kernel_size=1)
+            self.up = nn.Upsample(scale_factor=2, mode=self.bilinear)
+            if self.bilinear != 'nearest':
+                self.up = nn.Upsample(scale_factor=2, mode=self.bilinear, align_corners=True)
+        else:
+            self.up = nn.ConvTranspose2d(
+                in_channels1, in_channels2, kernel_size=2, stride=2)
+        self.conv = ConvBlock(in_channels2 * 2, out_channels, dropout_p)
+    def forward(self, x1, x2):
+        if self.bilinear != 'convtrans':
+            x1 = self.conv1x1(x1)
+        x1 = self.up(x1)
+        x = torch.cat([x2, x1], dim=1)
+        return self.conv(x)
+class Encoder(nn.Module):
+    def __init__(self, params):
+        super(Encoder, self).__init__()
+        self.params = params
+        self.in_chns = self.params['in_chns']
+        self.ft_chns = self.params['feature_chns']
+        self.n_class = self.params['class_num']
+        self.bilinear = self.params['bilinear']
+        self.dropout = self.params['dropout']
+        assert (len(self.ft_chns) == 5)
+        self.in_conv = ConvBlock(
+            self.in_chns, self.ft_chns[0], self.dropout[0])
+        self.down1 = DownBlock(
+            self.ft_chns[0], self.ft_chns[1], self.dropout[1])
+        self.down2 = DownBlock(
+            self.ft_chns[1], self.ft_chns[2], self.dropout[2])
+        self.down3 = DownBlock(
+            self.ft_chns[2], self.ft_chns[3], self.dropout[3])
+        self.down4 = DownBlock(
+            self.ft_chns[3], self.ft_chns[4], self.dropout[4])
+    def forward(self, x):
+        x0 = self.in_conv(x)
+        x1 = self.down1(x0)
+        x2 = self.down2(x1)
+        x3 = self.down3(x2)
+        x4 = self.down4(x3)
+        return [x0, x1, x2, x3, x4]
+class Decoder(nn.Module):
+    def __init__(self, params):
+        super(Decoder, self).__init__()
+        self.params = params
+        self.in_chns = self.params['in_chns']
+        self.ft_chns = self.params['feature_chns']
+        self.n_class = self.params['class_num']
+        self.bilinear = self.params['bilinear']
+        assert (len(self.ft_chns) == 5)
+        self.up1 = UpBlock(
+            self.ft_chns[4], self.ft_chns[3], self.ft_chns[3], dropout_p=0.0, bilinear=self.bilinear)
+        self.up2 = UpBlock(
+            self.ft_chns[3], self.ft_chns[2], self.ft_chns[2], dropout_p=0.0, bilinear=self.bilinear)
+        self.up3 = UpBlock(
+            self.ft_chns[2], self.ft_chns[1], self.ft_chns[1], dropout_p=0.0, bilinear=self.bilinear)
+        self.up4 = UpBlock(
+            self.ft_chns[1], self.ft_chns[0], self.ft_chns[0], dropout_p=0.0, bilinear=self.bilinear)
+        self.out_conv = nn.Conv2d(self.ft_chns[0], self.n_class,
+                                  kernel_size=3, padding=1)
+    def forward(self, feature):
+        x0 = feature[0]
+        x1 = feature[1]
+        x2 = feature[2]
+        x3 = feature[3]
+        x4 = feature[4]
+        x = self.up1(x4, x3)
+        x = self.up2(x, x2)
+        x = self.up3(x, x1)
+        x = self.up4(x, x0)
+        output = self.out_conv(x)
+        return output
+class Decoder_DS(nn.Module):
+    def __init__(self, params):
+        super(Decoder_DS, self).__init__()
+        self.params = params
+        self.in_chns = self.params['in_chns']
+        self.ft_chns = self.params['feature_chns']
+        self.n_class = self.params['class_num']
+        self.bilinear = self.params['bilinear']
+        assert (len(self.ft_chns) == 5)
+        self.up1 = UpBlock(
+            self.ft_chns[4], self.ft_chns[3], self.ft_chns[3], dropout_p=0.0)
+        self.up2 = UpBlock(
+            self.ft_chns[3], self.ft_chns[2], self.ft_chns[2], dropout_p=0.0)
+        self.up3 = UpBlock(
+            self.ft_chns[2], self.ft_chns[1], self.ft_chns[1], dropout_p=0.0)
+        self.up4 = UpBlock(
+            self.ft_chns[1], self.ft_chns[0], self.ft_chns[0], dropout_p=0.0)
+        self.out_conv = nn.Conv2d(self.ft_chns[0], self.n_class,
+                                  kernel_size=3, padding=1)
+        self.out_conv_dp4 = nn.Conv2d(self.ft_chns[4], self.n_class,
+                                      kernel_size=3, padding=1)
+        self.out_conv_dp3 = nn.Conv2d(self.ft_chns[3], self.n_class,
+                                      kernel_size=3, padding=1)
+        self.out_conv_dp2 = nn.Conv2d(self.ft_chns[2], self.n_class,
+                                      kernel_size=3, padding=1)
+        self.out_conv_dp1 = nn.Conv2d(self.ft_chns[1], self.n_class,
+                                      kernel_size=3, padding=1)
+    def forward(self, feature, shape):
+        x0 = feature[0]
+        x1 = feature[1]
+        x2 = feature[2]
+        x3 = feature[3]
+        x4 = feature[4]
+        x = self.up1(x4, x3)
+        dp3_out_seg = self.out_conv_dp3(x)
+        dp3_out_seg = torch.nn.functional.interpolate(dp3_out_seg, shape)
+        x = self.up2(x, x2)
+        dp2_out_seg = self.out_conv_dp2(x)
+        dp2_out_seg = torch.nn.functional.interpolate(dp2_out_seg, shape)
+        x = self.up3(x, x1)
+        dp1_out_seg = self.out_conv_dp1(x)
+        dp1_out_seg = torch.nn.functional.interpolate(dp1_out_seg, shape)
+        x = self.up4(x, x0)
+        dp0_out_seg = self.out_conv(x)
+        return dp0_out_seg, dp1_out_seg, dp2_out_seg, dp3_out_seg
+class Decoder_URDS(nn.Module):
+    def __init__(self, params):
+        super(Decoder_URDS, self).__init__()
+        self.params = params
+        self.in_chns = self.params['in_chns']
+        self.ft_chns = self.params['feature_chns']
+        self.n_class = self.params['class_num']
+        self.bilinear = self.params['bilinear']
+        assert (len(self.ft_chns) == 5)
+        self.up1 = UpBlock(
+            self.ft_chns[4], self.ft_chns[3], self.ft_chns[3], dropout_p=0.0)
+        self.up2 = UpBlock(
+            self.ft_chns[3], self.ft_chns[2], self.ft_chns[2], dropout_p=0.0)
+        self.up3 = UpBlock(
+            self.ft_chns[2], self.ft_chns[1], self.ft_chns[1], dropout_p=0.0)
+        self.up4 = UpBlock(
+            self.ft_chns[1], self.ft_chns[0], self.ft_chns[0], dropout_p=0.0)
+        self.out_conv = nn.Conv2d(self.ft_chns[0], self.n_class,
+                                  kernel_size=3, padding=1)
+        self.out_conv_dp4 = nn.Conv2d(self.ft_chns[4], self.n_class,
+                                      kernel_size=3, padding=1)
+        self.out_conv_dp3 = nn.Conv2d(self.ft_chns[3], self.n_class,
+                                      kernel_size=3, padding=1)
+        self.out_conv_dp2 = nn.Conv2d(self.ft_chns[2], self.n_class,
+                                      kernel_size=3, padding=1)
+        self.out_conv_dp1 = nn.Conv2d(self.ft_chns[1], self.n_class,
+                                      kernel_size=3, padding=1)
+        self.feature_noise = FeatureNoise()
+    def forward(self, feature, shape):
+        x0 = feature[0]
+        x1 = feature[1]
+        x2 = feature[2]
+        x3 = feature[3]
+        x4 = feature[4]
+        x = self.up1(x4, x3)
+        if self.training:
+            dp3_out_seg = self.out_conv_dp3(Dropout(x, p=0.5))
+        else:
+            dp3_out_seg = self.out_conv_dp3(x)
+        dp3_out_seg = torch.nn.functional.interpolate(dp3_out_seg, shape)
+        x = self.up2(x, x2)
+        if self.training:
+            dp2_out_seg = self.out_conv_dp2(FeatureDropout(x))
+        else:
+            dp2_out_seg = self.out_conv_dp2(x)
+        dp2_out_seg = torch.nn.functional.interpolate(dp2_out_seg, shape)
+        x = self.up3(x, x1)
+        if self.training:
+            dp1_out_seg = self.out_conv_dp1(self.feature_noise(x))
+        else:
+            dp1_out_seg = self.out_conv_dp1(x)
+        dp1_out_seg = torch.nn.functional.interpolate(dp1_out_seg, shape)
+        x = self.up4(x, x0)
+        dp0_out_seg = self.out_conv(x)
+        return dp0_out_seg, dp1_out_seg, dp2_out_seg, dp3_out_seg
+def Dropout(x, p=0.5):
+    x = torch.nn.functional.dropout2d(x, p)
+    return x
+def FeatureDropout(x):
+    attention = torch.mean(x, dim=1, keepdim=True)
+    max_val, _ = torch.max(attention.view(
+        x.size(0), -1), dim=1, keepdim=True)
+    threshold = max_val * np.random.uniform(0.7, 0.9)
+    threshold = threshold.view(x.size(0), 1, 1, 1).expand_as(attention)
+    drop_mask = (attention < threshold).float()
+    x = x.mul(drop_mask)
+    return x
+class FeatureNoise(nn.Module):
+    def __init__(self, uniform_range=0.3):
+        super(FeatureNoise, self).__init__()
+        self.uni_dist = Uniform(-uniform_range, uniform_range)
+    def feature_based_noise(self, x):
+        noise_vector = self.uni_dist.sample(
+            x.shape[1:]).to(x.device).unsqueeze(0)
+        x_noise = x.mul(noise_vector) + x
+        return x_noise
+    def forward(self, x):
+        x = self.feature_based_noise(x)
+        return x
+class UNet(nn.Module):
+    def __init__(self, in_chns, class_num):
+        super(UNet, self).__init__()
+        params = {'in_chns': in_chns,
+                  'feature_chns': [16, 32, 64, 128, 256],
+                  'dropout': [0.05, 0.1, 0.2, 0.3, 0.5],
+                  'class_num': class_num,
+                  'bilinear': 'nearest',
+                  'acti_func': 'relu'}
+        self.encoder = Encoder(params)
+        self.decoder = Decoder(params)
+    def forward(self, x):
+        feature = self.encoder(x)
+        output = self.decoder(feature)
+        return output
+class UNet_DS(nn.Module):
+    def __init__(self, in_chns, class_num):
+        super(UNet_DS, self).__init__()
+        params = {'in_chns': in_chns,
+                  'feature_chns': [16, 32, 64, 128, 256],
+                  'dropout': [0.05, 0.1, 0.2, 0.3, 0.5],
+                  'class_num': class_num,
+                  'bilinear': False,
+                  'acti_func': 'relu'}
+        self.encoder = Encoder(params)
+        self.decoder = Decoder_DS(params)
+    def forward(self, x):
+        shape = x.shape[2:]
+        feature = self.encoder(x)
+        dp0_out_seg, dp1_out_seg, dp2_out_seg, dp3_out_seg = self.decoder(
+            feature, shape)
+        return dp0_out_seg, dp1_out_seg, dp2_out_seg, dp3_out_seg
+class UNet_CCT(nn.Module):
+    def __init__(self, in_chns, class_num):
+        super(UNet_CCT, self).__init__()
+        params = {'in_chns': in_chns,
+                  'feature_chns': [16, 32, 64, 128, 256],
+                  'dropout': [0.05, 0.1, 0.2, 0.3, 0.5],
+                  'class_num': class_num,
+                  'bilinear': 'nearest',
+                  'acti_func': 'relu'}
+        self.encoder = Encoder(params)
+        self.main_decoder = Decoder(params)
+        self.aux_decoder1 = Decoder(params)
+    def forward(self, x):
+        feature = self.encoder(x)
+        main_seg = self.main_decoder(feature)
+        aux1_feature = [Dropout(i) for i in feature]
+        aux_seg1 = self.aux_decoder1(aux1_feature)
+        return main_seg, aux_seg1
+class UNet_CCT_3H(nn.Module):
+    def __init__(self, in_chns, class_num):
+        super(UNet_CCT_3H, self).__init__()
+        params = {'in_chns': in_chns,
+                  'feature_chns': [16, 32, 64, 128, 256],
+                  'dropout': [0.05, 0.1, 0.2, 0.3, 0.5],
+                  'class_num': class_num,
+                  'bilinear': False,
+                  'acti_func': 'relu'}
+        self.encoder = Encoder(params)
+        self.main_decoder = Decoder(params)
+        self.aux_decoder1 = Decoder(params)
+        self.aux_decoder2 = Decoder(params)
+    def forward(self, x):
+        feature = self.encoder(x)
+        main_seg = self.main_decoder(feature)
+        aux1_feature = [Dropout(i) for i in feature]
+        aux_seg1 = self.aux_decoder1(aux1_feature)
+        aux2_feature = [FeatureNoise()(i) for i in feature]
+        aux_seg2 = self.aux_decoder1(aux2_feature)
+        return main_seg, aux_seg1, aux_seg2

unet_model.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4a1747468feb2005f81ff818f234f8358553ec017c6c1603dc5e046f2fc6ea39
+size 7316273