From 352ed6a98791ce97cec1bfcb427ae4d38bc3ceeb Mon Sep 17 00:00:00 2001
From: ys-li <56712176+Yshuo-Li@users.noreply.github.com>
Date: Sun, 25 Apr 2021 23:37:06 +0800
Subject: [PATCH] Add RDN. (#233)

* add RDN

* Add docstring and test.

* Tiny fix.

* Tiny fix.

* Add license.

* Tiny Fix

* Tiny Fix

Co-authored-by: liyinshuo <liyinshuo@sensetime.com>
---
 mmedit/models/backbones/__init__.py           |   4 +-
 .../models/backbones/sr_backbones/__init__.py |   3 +-
 mmedit/models/backbones/sr_backbones/rdn.py   | 200 ++++++++++++++++++
 tests/test_rdn.py                             |  56 +++++
 4 files changed, 260 insertions(+), 3 deletions(-)
 create mode 100644 mmedit/models/backbones/sr_backbones/rdn.py
 create mode 100644 tests/test_rdn.py

diff --git a/mmedit/models/backbones/__init__.py b/mmedit/models/backbones/__init__.py
index 72d5ea179c..444bb01c88 100644
--- a/mmedit/models/backbones/__init__.py
+++ b/mmedit/models/backbones/__init__.py
@@ -12,7 +12,7 @@
                                SimpleEncoderDecoder)
 # yapf: enable
 from .generation_backbones import ResnetGenerator, UnetGenerator
-from .sr_backbones import (EDSR, SRCNN, BasicVSRNet, EDVRNet, IconVSR,
+from .sr_backbones import (EDSR, RDN, SRCNN, BasicVSRNet, EDVRNet, IconVSR,
                            MSRResNet, RRDBNet, TOFlow)
 
 __all__ = [
@@ -21,7 +21,7 @@
     'PConvEncoderDecoder', 'PConvEncoder', 'PConvDecoder', 'ResNetEnc',
     'ResNetDec', 'ResShortcutEnc', 'ResShortcutDec', 'RRDBNet',
     'DeepFillEncoder', 'HolisticIndexBlock', 'DepthwiseIndexBlock',
-    'ContextualAttentionNeck', 'DeepFillDecoder', 'EDSR',
+    'ContextualAttentionNeck', 'DeepFillDecoder', 'EDSR', 'RDN',
     'DeepFillEncoderDecoder', 'EDVRNet', 'IndexedUpsample', 'IndexNetEncoder',
     'IndexNetDecoder', 'TOFlow', 'ResGCAEncoder', 'ResGCADecoder', 'SRCNN',
     'UnetGenerator', 'ResnetGenerator', 'FBAResnetDilated', 'FBADecoder',
diff --git a/mmedit/models/backbones/sr_backbones/__init__.py b/mmedit/models/backbones/sr_backbones/__init__.py
index 22b15d41ba..d96a81a9ca 100644
--- a/mmedit/models/backbones/sr_backbones/__init__.py
+++ b/mmedit/models/backbones/sr_backbones/__init__.py
@@ -2,6 +2,7 @@
 from .edsr import EDSR
 from .edvr_net import EDVRNet
 from .iconvsr import IconVSR
+from .rdn import RDN
 from .rrdb_net import RRDBNet
 from .sr_resnet import MSRResNet
 from .srcnn import SRCNN
@@ -9,5 +10,5 @@
 
 __all__ = [
     'MSRResNet', 'RRDBNet', 'EDSR', 'EDVRNet', 'TOFlow', 'SRCNN',
-    'BasicVSRNet', 'IconVSR'
+    'BasicVSRNet', 'IconVSR', 'RDN'
 ]
diff --git a/mmedit/models/backbones/sr_backbones/rdn.py b/mmedit/models/backbones/sr_backbones/rdn.py
new file mode 100644
index 0000000000..b0d643fe2b
--- /dev/null
+++ b/mmedit/models/backbones/sr_backbones/rdn.py
@@ -0,0 +1,200 @@
+import torch
+from mmcv.runner import load_checkpoint
+from torch import nn
+
+from mmedit.models.registry import BACKBONES
+from mmedit.utils import get_root_logger
+
+
+class DenseLayer(nn.Module):
+    """Dense layer: 3x3 conv + ReLU, concatenated with its input.
+
+    Args:
+        in_channels (int): Channel number of inputs.
+        out_channels (int): Channels produced by the conv; the layer
+            returns ``in_channels + out_channels`` channels.
+    """
+
+    def __init__(self, in_channels, out_channels):
+        super().__init__()
+        self.conv = nn.Conv2d(
+            in_channels, out_channels, kernel_size=3, padding=3 // 2)
+        self.relu = nn.ReLU(inplace=True)
+
+    def forward(self, x):
+        """Forward function.
+
+        Args:
+            x (Tensor): Input tensor with shape (n, c_in, h, w).
+
+        Returns:
+            Tensor: Forward results, tensor with shape (n, c_in+c_out, h, w).
+        """
+        return torch.cat([x, self.relu(self.conv(x))], 1)
+
+
+class RDB(nn.Module):
+    """Residual Dense Block of Residual Dense Network
+
+    Args:
+        in_channels (int): Channel number of inputs (and of the output).
+        channel_growth (int): Channels growth in each layer.
+        num_layers (int): Layer number in the Residual Dense Block.
+    """
+
+    def __init__(self, in_channels, channel_growth, num_layers):
+        super().__init__()
+        self.layers = nn.Sequential(*[
+            DenseLayer(in_channels + channel_growth * i, channel_growth)
+            for i in range(num_layers)
+        ])
+
+        # local feature fusion; project back to in_channels for the skip
+        self.lff = nn.Conv2d(
+            in_channels + channel_growth * num_layers,
+            in_channels,
+            kernel_size=1)
+
+    def forward(self, x):
+        """Forward function.
+
+        Args:
+            x (Tensor): Input tensor with shape (n, c, h, w).
+
+        Returns:
+            Tensor: Forward results, tensor with shape (n, c, h, w).
+        """
+        return x + self.lff(self.layers(x))  # local residual learning
+
+
+@BACKBONES.register_module()
+class RDN(nn.Module):
+    """RDN model for single image super-resolution.
+
+    Paper: Residual Dense Network for Image Super-Resolution
+
+    Adapted from 'https://github.com/yjn870/RDN-pytorch.git'
+    'RDN-pytorch/blob/master/models.py'
+    Copyright (c) 2021, JaeYun Yeo, under MIT License.
+
+    Args:
+        in_channels (int): Channel number of inputs.
+        out_channels (int): Channel number of outputs.
+        mid_channels (int): Channel number of intermediate features.
+            Default: 64.
+        num_blocks (int): Block number in the trunk network. Default: 16.
+        upscale_factor (int): Upsampling factor. Support 2, 3 and 4.
+            Default: 4.
+        num_layers (int): Layer number in the Residual Dense Block.
+            Default: 8.
+        channel_growth (int): Channels growth in each layer of RDB.
+            Default: 64.
+    """
+
+    def __init__(self,
+                 in_channels,
+                 out_channels,
+                 mid_channels=64,
+                 num_blocks=16,
+                 upscale_factor=4,
+                 num_layers=8,
+                 channel_growth=64):
+
+        super().__init__()
+        self.mid_channels = mid_channels
+        self.channel_growth = channel_growth
+        self.num_blocks = num_blocks
+        self.num_layers = num_layers
+
+        # shallow feature extraction
+        self.sfe1 = nn.Conv2d(
+            in_channels, mid_channels, kernel_size=3, padding=3 // 2)
+        self.sfe2 = nn.Conv2d(
+            mid_channels, mid_channels, kernel_size=3, padding=3 // 2)
+
+        # residual dense blocks: every block maps mid_channels to
+        # mid_channels, so channel_growth may differ from mid_channels
+        self.rdbs = nn.ModuleList([
+            RDB(self.mid_channels, self.channel_growth, self.num_layers)
+            for _ in range(self.num_blocks)
+        ])
+
+        # global feature fusion
+        self.gff = nn.Sequential(
+            nn.Conv2d(
+                self.mid_channels * self.num_blocks,
+                self.mid_channels,
+                kernel_size=1),
+            nn.Conv2d(
+                self.mid_channels,
+                self.mid_channels,
+                kernel_size=3,
+                padding=3 // 2))
+
+        # up-sampling
+        assert 2 <= upscale_factor <= 4
+        if upscale_factor == 2 or upscale_factor == 4:
+            upscale_layers = []
+            for _ in range(upscale_factor // 2):
+                upscale_layers.extend([
+                    nn.Conv2d(
+                        self.mid_channels,
+                        self.mid_channels * (2**2),
+                        kernel_size=3,
+                        padding=3 // 2),
+                    nn.PixelShuffle(2)
+                ])
+            self.upscale = nn.Sequential(*upscale_layers)
+        else:
+            self.upscale = nn.Sequential(
+                nn.Conv2d(
+                    self.mid_channels,
+                    self.mid_channels * (upscale_factor**2),
+                    kernel_size=3,
+                    padding=3 // 2), nn.PixelShuffle(upscale_factor))
+
+        self.output = nn.Conv2d(
+            self.mid_channels, out_channels, kernel_size=3, padding=3 // 2)
+
+    def forward(self, x):
+        """Forward function.
+
+        Args:
+            x (Tensor): Input tensor with shape (n, c, h, w).
+
+        Returns:
+            Tensor: Forward results.
+        """
+
+        sfe1 = self.sfe1(x)
+        sfe2 = self.sfe2(sfe1)
+
+        x = sfe2
+        local_features = []
+        for rdb in self.rdbs:
+            x = rdb(x)
+            local_features.append(x)
+
+        x = self.gff(torch.cat(local_features, 1)) + sfe1
+        # global residual learning
+        x = self.upscale(x)
+        x = self.output(x)
+        return x
+
+    def init_weights(self, pretrained=None, strict=True):
+        """Init weights for models.
+
+        Args:
+            pretrained (str, optional): Path for pretrained weights. If given
+                None, pretrained weights will not be loaded. Defaults to None.
+            strict (bool, optional): Whether strictly load the pretrained
+                model. Defaults to True.
+        """
+        if isinstance(pretrained, str):
+            logger = get_root_logger()
+            load_checkpoint(self, pretrained, strict=strict, logger=logger)
+        elif pretrained is None:
+            pass  # use default initialization
+        else:
+            raise TypeError('"pretrained" must be a str or None. '
+                            f'But received {type(pretrained)}.')
diff --git a/tests/test_rdn.py b/tests/test_rdn.py
new file mode 100644
index 0000000000..ccf07fa9c0
--- /dev/null
+++ b/tests/test_rdn.py
@@ -0,0 +1,56 @@
+import torch
+import torch.nn as nn
+
+from mmedit.models import build_backbone
+
+
+def test_rdn():
+    """Build RDN and check a x4 forward/backward step on CPU (and GPU)."""
+    scale = 4
+
+    model_cfg = dict(
+        type='RDN',
+        in_channels=3,
+        out_channels=3,
+        mid_channels=64,
+        num_blocks=16,
+        upscale_factor=scale)
+
+    # build model
+    model = build_backbone(model_cfg)
+
+    # test attributes
+    assert model.__class__.__name__ == 'RDN'
+
+    # prepare data
+    inputs = torch.rand(1, 3, 32, 16)
+    targets = torch.rand(1, 3, 128, 64)
+
+    # prepare loss
+    loss_function = nn.L1Loss()
+
+    # prepare optimizer
+    optimizer = torch.optim.Adam(model.parameters())
+
+    # test on cpu
+    output = model(inputs)
+    optimizer.zero_grad()
+    loss = loss_function(output, targets)
+    loss.backward()
+    optimizer.step()
+    assert torch.is_tensor(output)
+    assert output.shape == targets.shape
+
+    # test on gpu
+    if torch.cuda.is_available():
+        model = model.cuda()
+        optimizer = torch.optim.Adam(model.parameters())
+        inputs = inputs.cuda()
+        targets = targets.cuda()
+        output = model(inputs)
+        optimizer.zero_grad()
+        loss = loss_function(output, targets)
+        loss.backward()
+        optimizer.step()
+        assert torch.is_tensor(output)
+        assert output.shape == targets.shape