fangvv
diff --git a/‎README.md
Lines changed: 48 additions & 0 deletions b/‎README.md
Lines changed: 48 additions & 0 deletions
diff --git a/‎codes/data/LQGT_classify_test.py
Lines changed: 127 additions & 0 deletions b/‎codes/data/LQGT_classify_test.py
Lines changed: 127 additions & 0 deletions
diff --git a/‎codes/data/LQGT_dataset.py
Lines changed: 132 additions & 0 deletions b/‎codes/data/LQGT_dataset.py
Lines changed: 132 additions & 0 deletions
@@ -0,0 +1,48 @@
+## CDNSR
+
+This is the source code for our paper: Classification-based Dynamic Network for Efficient Super-Resolution. A brief introduction of this work is as follows:
+
+> Deep neural networks (DNNs) based approaches have achieved superior performance in single image super-resolution (SR). To obtain better visual quality, DNNs for SR are generally designed with massive computation overhead. To accelerate network inference under resource constraints, we propose a classification-based dynamic network for efficient super-resolution (CDNSR), which combines the classification and SR networks in a unified framework. Specifically, CDNSR decomposes a large image into a number of image-patches, and uses a classification network to categorize them into different classes based on the restoration difficulty. Each class of image-patches will be handled by the SR network that corresponds to the difficulty of this class. In particular, we design a new loss to trade off between the computational overhead and the reconstruction quality. Besides, we apply contrastive learning based knowledge distillation to guarantee the performance of SR networks and the quality of reconstructed images. Extensive experiments show that CDNSR significantly outperforms the other SR networks and backbones on image quality and computational overhead.
+
+This paper has been accepted by ICASSP 2023. Due to the 5-page limitation of this conference, we provide a full version of technique report in this repo.
+
+## Required software
+
+PyTorch
+
+## Pre-train & test SR-Nets
+`train`
+```python
+cd codes
+python train_SR_Net.py -opt options/train/train_CARN_branch1.yml
+python train_SR_Net.py -opt options/train/train_CARN_branch2.yml
+python train_SR_Net.py -opt options/train/train_CARN_branch3.yml
+```
+`test`
+```
+cd codes
+python test_SR_Net.py -opt options/test/test_CARN.yml
+```
+
+## Train & test CDNSR
+`train`
+```
+cd codes
+python train_CDNSR.py -opt options/train/train_CDNSR_CARN.yml
+
+```
+`distill`
+```
+cd codes
+python train_CDNSR.py -opt options/train/train_CDNSR_CARN_KD.yml
+```
+
+`test`
+```
+cd codes
+python test_CDNSR.py -opt options/test/test_CDNSR_CARN.yml
+```
+
+## Contact
+
+Qi Wang ([email protected])
@@ -0,0 +1,127 @@
+import random
+import numpy as np
+import cv2
+import lmdb
+import torch
+import torch.utils.data as data
+import data.util as util
+
+
+class LQGTDataset(data.Dataset):
+    """
+    Read LQ (Low Quality, e.g. LR (Low Resolution), blurry, etc) and GT image pairs.
+    If only GT images are provided, generate LQ images on-the-fly.
+    """
+
+    def __init__(self, opt):
+        super(LQGTDataset, self).__init__()
+        self.opt = opt
+        self.data_type = self.opt['data_type']
+        self.paths_LQ, self.paths_GT = None, None
+        self.sizes_LQ, self.sizes_GT = None, None
+        self.LQ_env, self.GT_env = None, None  # environments for lmdb
+
+        self.paths_GT, self.sizes_GT = util.get_image_paths(self.data_type, opt['dataroot_GT'])
+        self.paths_LQ, self.sizes_LQ = util.get_image_paths(self.data_type, opt['dataroot_LQ'])
+        assert self.paths_GT, 'Error: GT path is empty.'
+        if self.paths_LQ and self.paths_GT:
+            assert len(self.paths_LQ) == len(
+                self.paths_GT
+            ), 'GT and LQ datasets have different number of images - {}, {}.'.format(
+                len(self.paths_LQ), len(self.paths_GT))
+        self.random_scale_list = [1]
+
+    def _init_lmdb(self):
+        # https://github.com/chainer/chainermn/issues/129
+        self.GT_env = lmdb.open(self.opt['dataroot_GT'], readonly=True, lock=False, readahead=False,
+                                meminit=False)
+        self.LQ_env = lmdb.open(self.opt['dataroot_LQ'], readonly=True, lock=False, readahead=False,
+                                meminit=False)
+
+    def __getitem__(self, index):
+        if self.data_type == 'lmdb' and (self.GT_env is None or self.LQ_env is None):
+            self._init_lmdb()
+        GT_path, LQ_path = None, None
+        scale = self.opt['scale']
+        GT_size = self.opt['GT_size']
+
+        # get GT image
+        GT_path = self.paths_GT[index]
+        resolution = [int(s) for s in self.sizes_GT[index].split('_')
+                      ] if self.data_type == 'lmdb' else None
+        img_GT = util.read_img(self.GT_env, GT_path, resolution)
+        if self.opt['phase'] != 'train':  # modcrop in the validation / test phase
+            img_GT = util.modcrop(img_GT, scale)
+        if self.opt['color']:  # change color space if necessary
+            img_GT = util.channel_convert(img_GT.shape[2], self.opt['color'], [img_GT])[0]
+
+        # get LQ image
+        if self.paths_LQ:
+            LQ_path = self.paths_LQ[index]
+            resolution = [int(s) for s in self.sizes_LQ[index].split('_')
+                          ] if self.data_type == 'lmdb' else None
+            img_LQ = util.read_img(self.LQ_env, LQ_path, resolution)
+        else:  # down-sampling on-the-fly
+            # randomly scale during training
+            if self.opt['phase'] == 'train':
+                random_scale = random.choice(self.random_scale_list)
+                H_s, W_s, _ = img_GT.shape
+
+                def _mod(n, random_scale, scale, thres):
+                    rlt = int(n * random_scale)
+                    rlt = (rlt // scale) * scale
+                    return thres if rlt < thres else rlt
+
+                H_s = _mod(H_s, random_scale, scale, GT_size)
+                W_s = _mod(W_s, random_scale, scale, GT_size)
+                img_GT = cv2.resize(img_GT, (W_s, H_s), interpolation=cv2.INTER_LINEAR)
+                if img_GT.ndim == 2:
+                    img_GT = cv2.cvtColor(img_GT, cv2.COLOR_GRAY2BGR)
+
+            H, W, _ = img_GT.shape
+            # using matlab imresize
+            img_LQ = util.imresize_np(img_GT, 1 / scale, True)
+            if img_LQ.ndim == 2:
+                img_LQ = np.expand_dims(img_LQ, axis=2)
+
+        if self.opt['phase'] == 'train':
+            # if the image size is too small
+            H, W, _ = img_GT.shape
+            if H < GT_size or W < GT_size:
+                img_GT = cv2.resize(img_GT, (GT_size, GT_size), interpolation=cv2.INTER_LINEAR)
+                # using matlab imresize
+                img_LQ = util.imresize_np(img_GT, 1 / scale, True)
+                if img_LQ.ndim == 2:
+                    img_LQ = np.expand_dims(img_LQ, axis=2)
+
+            H, W, C = img_LQ.shape
+            LQ_size = GT_size // scale
+
+            # randomly crop
+            rnd_h = random.randint(0, max(0, H - LQ_size))
+            rnd_w = random.randint(0, max(0, W - LQ_size))
+            img_LQ = img_LQ[rnd_h:rnd_h + LQ_size, rnd_w:rnd_w + LQ_size, :]
+            rnd_h_GT, rnd_w_GT = int(rnd_h * scale), int(rnd_w * scale)
+            img_GT = img_GT[rnd_h_GT:rnd_h_GT + GT_size, rnd_w_GT:rnd_w_GT + GT_size, :]
+
+            # augmentation - flip, rotate
+            img_LQ, img_GT = util.augment([img_LQ, img_GT], self.opt['use_flip'],
+                                          self.opt['use_rot'])
+
+        if self.opt['color']:  # change color space if necessary
+            img_LQ = util.channel_convert(C, self.opt['color'],
+                                          [img_LQ])[0]  # TODO during val no definition
+
+        # BGR to RGB, HWC to CHW, numpy to tensor
+        if img_GT.shape[2] == 3:
+            img_GT = img_GT[:, :, [2, 1, 0]]
+            img_LQ = img_LQ[:, :, [2, 1, 0]]
+        img_GT = torch.from_numpy(np.ascontiguousarray(np.transpose(img_GT, (2, 0, 1)))).float()
+        img_LQ = torch.from_numpy(np.ascontiguousarray(np.transpose(img_LQ, (2, 0, 1)))).float()
+
+        if LQ_path is None:
+            LQ_path = GT_path
+        return {'LQ': img_LQ, 'GT': img_GT, 'LQ_path': LQ_path, 'GT_path': GT_path}
+
+    def __len__(self):
+        return len(self.paths_GT)
@@ -0,0 +1,132 @@
+import random
+import numpy as np
+import cv2
+import lmdb
+import torch
+import torch.utils.data as data
+import data.util as util
+
+
+class LQGTDataset(data.Dataset):
+    """
+    Read LQ (Low Quality, e.g. LR (Low Resolution), blurry, etc) and GT image pairs.
+    If only GT images are provided, generate LQ images on-the-fly.
+    """
+
+    def __init__(self, opt):
+        super(LQGTDataset, self).__init__()
+        self.opt = opt
+        self.data_type = self.opt['data_type']
+        self.paths_LQ, self.paths_GT = None, None
+        self.sizes_LQ, self.sizes_GT = None, None
+        self.LQ_env, self.GT_env = None, None  # environments for lmdb
+
+        self.paths_GT, self.sizes_GT = util.get_image_paths(self.data_type, opt['dataroot_GT'])
+        self.paths_LQ, self.sizes_LQ = util.get_image_paths(self.data_type, opt['dataroot_LQ'])
+
+        # self.paths_GT=[self.paths_GT[400000],self.paths_GT[800000],self.paths_GT[1200000]]
+        # self.paths_LQ=[self.paths_LQ[400000],self.paths_LQ[800000],self.paths_LQ[1200000]]
+
+
+        assert self.paths_GT, 'Error: GT path is empty.'
+        if self.paths_LQ and self.paths_GT:
+            assert len(self.paths_LQ) == len(
+                self.paths_GT
+            ), 'GT and LQ datasets have different number of images - {}, {}.'.format(
+                len(self.paths_LQ), len(self.paths_GT))
+        self.random_scale_list = [1]
+
+    def _init_lmdb(self):
+        # https://github.com/chainer/chainermn/issues/129
+        self.GT_env = lmdb.open(self.opt['dataroot_GT'], readonly=True, lock=False, readahead=False,
+                                meminit=False)
+        self.LQ_env = lmdb.open(self.opt['dataroot_LQ'], readonly=True, lock=False, readahead=False,
+                                meminit=False)
+
+    def __getitem__(self, index):
+        if self.data_type == 'lmdb' and (self.GT_env is None or self.LQ_env is None):
+            self._init_lmdb()
+        GT_path, LQ_path = None, None
+        scale = self.opt['scale']
+        GT_size = self.opt['GT_size']
+
+        # get GT image
+        GT_path = self.paths_GT[index]
+        resolution = [int(s) for s in self.sizes_GT[index].split('_')
+                      ] if self.data_type == 'lmdb' else None
+        img_GT = util.read_img(self.GT_env, GT_path, resolution)
+        if self.opt['phase'] != 'train':  # modcrop in the validation / test phase
+            img_GT = util.modcrop(img_GT, scale)
+        if self.opt['color']:  # change color space if necessary
+            img_GT = util.channel_convert(img_GT.shape[2], self.opt['color'], [img_GT])[0]
+
+        # get LQ image
+        if self.paths_LQ:
+            LQ_path = self.paths_LQ[index]
+            resolution = [int(s) for s in self.sizes_LQ[index].split('_')
+                          ] if self.data_type == 'lmdb' else None
+            img_LQ = util.read_img(self.LQ_env, LQ_path, resolution)
+        else:  # down-sampling on-the-fly
+            # randomly scale during training
+            if self.opt['phase'] == 'train':
+                random_scale = random.choice(self.random_scale_list)
+                H_s, W_s, _ = img_GT.shape
+
+                def _mod(n, random_scale, scale, thres):
+                    rlt = int(n * random_scale)
+                    rlt = (rlt // scale) * scale
+                    return thres if rlt < thres else rlt
+
+                H_s = _mod(H_s, random_scale, scale, GT_size)
+                W_s = _mod(W_s, random_scale, scale, GT_size)
+                img_GT = cv2.resize(img_GT, (W_s, H_s), interpolation=cv2.INTER_LINEAR)
+                if img_GT.ndim == 2:
+                    img_GT = cv2.cvtColor(img_GT, cv2.COLOR_GRAY2BGR)
+
+            H, W, _ = img_GT.shape
+            # using matlab imresize
+            img_LQ = util.imresize_np(img_GT, 1 / scale, True)
+            if img_LQ.ndim == 2:
+                img_LQ = np.expand_dims(img_LQ, axis=2)
+
+        if self.opt['phase'] == 'train':
+            # if the image size is too small
+            H, W, _ = img_GT.shape
+            if H < GT_size or W < GT_size:
+                img_GT = cv2.resize(img_GT, (GT_size, GT_size), interpolation=cv2.INTER_LINEAR)
+                # using matlab imresize
+                img_LQ = util.imresize_np(img_GT, 1 / scale, True)
+                if img_LQ.ndim == 2:
+                    img_LQ = np.expand_dims(img_LQ, axis=2)
+
+            H, W, C = img_LQ.shape
+            LQ_size = GT_size // scale
+
+            # randomly crop
+            rnd_h = random.randint(0, max(0, H - LQ_size))
+            rnd_w = random.randint(0, max(0, W - LQ_size))
+            img_LQ = img_LQ[rnd_h:rnd_h + LQ_size, rnd_w:rnd_w + LQ_size, :]
+            rnd_h_GT, rnd_w_GT = int(rnd_h * scale), int(rnd_w * scale)
+            img_GT = img_GT[rnd_h_GT:rnd_h_GT + GT_size, rnd_w_GT:rnd_w_GT + GT_size, :]
+
+            # augmentation - flip, rotate
+            img_LQ, img_GT = util.augment([img_LQ, img_GT], self.opt['use_flip'],
+                                          self.opt['use_rot'])
+
+        if self.opt['color']:  # change color space if necessary
+            img_LQ = util.channel_convert(C, self.opt['color'],
+                                          [img_LQ])[0]  # TODO during val no definition
+
+        # BGR to RGB, HWC to CHW, numpy to tensor
+        if img_GT.shape[2] == 3:
+            img_GT = img_GT[:, :, [2, 1, 0]]
+            img_LQ = img_LQ[:, :, [2, 1, 0]]
+        img_GT = torch.from_numpy(np.ascontiguousarray(np.transpose(img_GT, (2, 0, 1)))).float()
+        img_LQ = torch.from_numpy(np.ascontiguousarray(np.transpose(img_LQ, (2, 0, 1)))).float()
+
+        if LQ_path is None:
+            LQ_path = GT_path
+        return {'LQ': img_LQ, 'GT': img_GT, 'LQ_path': LQ_path, 'GT_path': GT_path}
+
+    def __len__(self):
+        return len(self.paths_GT)