Skip to content

Instantly share code, notes, and snippets.

Created May 18, 2020 11:03
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save satyajitghana/b24bfb66040e7dbecc0a7d4cf7d5fa32 to your computer and use it in GitHub Desktop.
Save satyajitghana/b24bfb66040e7dbecc0a7d4cf7d5fa32 to your computer and use it in GitHub Desktop.
import torch
import torch.nn as nn
class ResDoubleConv(nn.Module):
    '''Basic DoubleConv of a ResNetV2.

    Applies BatchNorm -> ReLU -> 3x3 conv twice. Both convolutions are
    bias-free and use padding 1, so height and width are preserved; only
    the channel count changes (in_channels -> out_channels).

    Args:
        in_channels: number of channels of the input tensor.
        out_channels: number of channels produced by each convolution.
    '''

    def __init__(self, in_channels, out_channels):
        super().__init__()
        # NOTE(review): the listing this was recovered from had no
        # normalisation/activation between the two convolutions (and the
        # Sequential was never closed), which would make the block a single
        # linear map. The convolution weights alone also add up to fewer
        # parameters than the 34,997,388 reported for ResUNet; the gap is
        # consistent with BatchNorm2d(in_channels) / BatchNorm2d(out_channels)
        # in these positions. The ReLU placement follows the usual
        # pre-activation (BN -> ReLU -> Conv) order -- TODO confirm.
        self.double_conv = nn.Sequential(
            nn.BatchNorm2d(in_channels),
            nn.ReLU(inplace=True),
            nn.Conv2d(in_channels, out_channels,
                      kernel_size=3, padding=1, bias=False),
            nn.BatchNorm2d(out_channels),
            nn.ReLU(inplace=True),
            nn.Conv2d(out_channels, out_channels,
                      kernel_size=3, padding=1, bias=False),
        )

    def forward(self, x):
        '''Return the double-convolved features of x.'''
        return self.double_conv(x)
class ResDownBlock(nn.Module):
    '''Basic DownBlock of a ResNetV2.

    Adds a 1x1-projected shortcut to the output of a ResDoubleConv and then
    halves the spatial size with 2x2 max pooling.

    Args:
        in_channels: number of channels of the input tensor.
        out_channels: number of channels of both returned tensors.
    '''

    def __init__(self, in_channels, out_channels):
        super().__init__()

        self.double_conv = ResDoubleConv(in_channels, out_channels)

        # 1x1 projection so the shortcut has out_channels channels and can be
        # added to the double-conv output.
        # NOTE(review): the BatchNorm2d after the projection was absent from
        # the listing this was recovered from (whose Sequential was also left
        # unclosed); it is restored because the parameter total reported for
        # ResUNet is larger than the convolution weights alone -- TODO confirm.
        self.proj_layer = nn.Sequential(
            nn.Conv2d(in_channels, out_channels,
                      kernel_size=1, stride=1, bias=False),
            nn.BatchNorm2d(out_channels),
        )

        self.down_sample = nn.MaxPool2d(2)

    def forward(self, input):
        '''Return (pooled, skip).

        skip is the residual sum at the input resolution; pooled is skip
        after 2x2 max pooling.
        '''
        identity = self.proj_layer(input)
        out = self.double_conv(input)
        out = out + identity
        return self.down_sample(out), out
class ResUpBlock(nn.Module):
    '''Basic UpBlock of a ResNetV2.

    Upsamples down_input by 2x, concatenates it with the skip connection
    (and optionally the matching feature map of another decoder) along the
    channel axis, then applies a ResDoubleConv with a 1x1-projected
    shortcut.

    Args:
        in_channels: number of channels of the concatenated tensor, i.e.
            down_input channels + skip_input channels
            (+ decoder_input channels when it is given).
        out_channels: number of channels of the returned tensor.
    '''

    def __init__(self, in_channels, out_channels):
        super().__init__()

        # PixelShuffle(2) doubles height/width and divides the channel count
        # by 4. It has no parameters, so the four modules yield identical
        # tensors; concatenating them brings the channel count back to that
        # of down_input (which must therefore be divisible by 4).
        self.upsample_1 = nn.PixelShuffle(2)
        self.upsample_2 = nn.PixelShuffle(2)
        self.upsample_3 = nn.PixelShuffle(2)
        self.upsample_4 = nn.PixelShuffle(2)

        self.double_conv = ResDoubleConv(in_channels, out_channels)

        # NOTE(review): the BatchNorm2d after the projection was absent from
        # the listing this was recovered from (whose Sequential was also left
        # unclosed); it is restored because the parameter total reported for
        # ResUNet is larger than the convolution weights alone -- TODO confirm.
        self.proj_layer = nn.Sequential(
            nn.Conv2d(in_channels, out_channels,
                      kernel_size=1, stride=1, bias=False),
            nn.BatchNorm2d(out_channels),
        )

    def forward(self, down_input, skip_input, decoder_input=None):
        '''Return the decoded features at twice the resolution of down_input.

        Args:
            down_input: features from the previous (coarser) stage.
            skip_input: encoder skip features; must have twice the height
                and width of down_input.
            decoder_input: optional features from another decoder at the
                same resolution as skip_input.
        '''
        features = [
            self.upsample_1(down_input),
            self.upsample_2(down_input),
            self.upsample_3(down_input),
            self.upsample_4(down_input),
            skip_input,
        ]
        if decoder_input is not None:
            features.append(decoder_input)

        # Channel order: upsampled x4, skip, then the optional decoder map.
        x = torch.cat(features, dim=1)

        identity = self.proj_layer(x)
        out = self.double_conv(x) + identity
        return out
class ResUNet(nn.Module):
    '''Residual U-Net with one shared encoder and two decoders.

    The depth decoder runs first; the segmentation decoder additionally
    receives the depth decoder's feature map at every stage. Each decoder
    ends in a 1x1 convolution producing a single-channel map.

    The shape comments below assume a 192x192 input with the default 6
    channels. Input height and width should be divisible by 16: each of the
    four MaxPool2d(2) stages halves the size (rounding down) while each
    PixelShuffle(2) doubles it exactly, so other sizes make the skip
    concatenations mismatch.

    Args:
        in_channels: number of channels of the input tensor (default 6).
    '''

    def __init__(self, in_channels=6):
        super().__init__()

        # Encoder
        # H / 2 ; input = 192x192x6 ; output = 96x96x64 ; skip1 = 192x192x64
        self.res_down1 = ResDownBlock(in_channels, 64)
        # H / 4 ; input = 96x96x64 ; output = 48x48x128 ; skip2 = 96x96x128
        self.res_down2 = ResDownBlock(64, 128)
        # H / 8 ; input = 48x48x128 ; output = 24x24x256 ; skip3 = 48x48x256
        self.res_down3 = ResDownBlock(128, 256)
        # H / 16 ; input = 24x24x256 ; output = 12x12x512 ; skip4 = 24x24x512
        self.res_down4 = ResDownBlock(256, 512)

        # Bridge ; input = 12x12x512 ; output = 12x12x512
        self.bridge = ResDoubleConv(512, 512)

        # Depth Decoder
        # H / 8 ; input = 24x24x512(upscaled) 24x24x512(skip4) ; output = 24x24x512(dskip4)
        self.d_res_up4 = ResUpBlock(512 + 512, 512)
        # H / 4 ; input = 48x48x512(upscaled) 48x48x256(skip3) ; output = 48x48x256(dskip3)
        self.d_res_up3 = ResUpBlock(512 + 256, 256)
        # H / 2 ; input = 96x96x256(upscaled) 96x96x128(skip2) ; output = 96x96x128(dskip2)
        self.d_res_up2 = ResUpBlock(256 + 128, 128)
        # H / 1 ; input = 192x192x128(upscaled) 192x192x64(skip1) ; output = 192x192x64(dskip1)
        self.d_res_up1 = ResUpBlock(128 + 64, 64)

        # Depth Output
        self.depth_output = nn.Conv2d(
            64, 1, kernel_size=1, stride=1, bias=False)  # output = 192x192x1

        # Segmentation Decoder
        # H / 8 ; input = 24x24x512(upscaled) 24x24x512(dskip4) 24x24x512(skip4) ; output = 24x24x512
        self.s_res_up4 = ResUpBlock(512 + 512 + 512, 512)
        # H / 4 ; input = 48x48x512(upscaled) 48x48x256(dskip3) 48x48x256(skip3) ; output = 48x48x256
        self.s_res_up3 = ResUpBlock(512 + 256 + 256, 256)
        # H / 2 ; input = 96x96x256(upscaled) 96x96x128(dskip2) 96x96x128(skip2) ; output = 96x96x128
        self.s_res_up2 = ResUpBlock(256 + 128 + 128, 128)
        # H / 1 ; input = 192x192x128(upscaled) 192x192x64(dskip1) 192x192x64(skip1) ; output = 192x192x64
        self.s_res_up1 = ResUpBlock(128 + 64 + 64, 64)

        # Segmentation Output
        self.segment_output = nn.Conv2d(
            64, 1, kernel_size=1, stride=1, bias=False)  # output = 192x192x1

    def forward(self, input):
        '''Return (d_out, s_out): the depth and segmentation maps.

        Both outputs have one channel and the same height and width as
        input.
        '''
        # Encoder
        rd1, skip1_out = self.res_down1(input)
        rd2, skip2_out = self.res_down2(rd1)
        rd3, skip3_out = self.res_down3(rd2)
        rd4, skip4_out = self.res_down4(rd3)

        # Bridge
        bridge = self.bridge(rd4)

        # Depth Decoder
        dru4 = self.d_res_up4(bridge, skip4_out)
        dru3 = self.d_res_up3(dru4, skip3_out)
        dru2 = self.d_res_up2(dru3, skip2_out)
        dru1 = self.d_res_up1(dru2, skip1_out)
        d_out = self.depth_output(dru1)

        # Segmentation Decoder (also fed the depth decoder's features)
        sru4 = self.s_res_up4(bridge, skip4_out, dru4)
        sru3 = self.s_res_up3(sru4, skip3_out, dru3)
        sru2 = self.s_res_up2(sru3, skip2_out, dru2)
        sru1 = self.s_res_up1(sru2, skip1_out, dru1)
        s_out = self.segment_output(sru1)

        return d_out, s_out
# Model summary (as reported alongside this code):
#   Total params: 34,997,388
#   Trainable params: 34,997,388
#   Non-trainable params: 0
#   Input size (MB): 0.84
#   Forward/backward pass size (MB): 14099077.69
#   Params size (MB): 133.50
#   Estimated Total Size (MB): 14099212.04
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment