Add dataset loading compatible with finetuning folder structure

2023-08-27 23:27:41 -03:00 · 2023-08-27 23:27:41 -03:00 · 5a278993e4
parent 07fbb2b72a
commit 5a278993e4
1 changed files with 220 additions and 0 deletions
--- a/KAIR/data/dataset_deeptempest_finetuning.py
+++ b/KAIR/data/dataset_deeptempest_finetuning.py
@ -0,0 +1,220 @@
+import os
+import random
+import numpy as np
+import torch
+import torch.utils.data as data
+import utils.utils_image as util
+from utils.DTutils import is_natural_patch
+import itertools
+
+
+class DatasetFFDNet(data.Dataset):
+    """
+    # -----------------------------------------
+    # Get paired L/H images (plus a noise-level map C) from the
+    # finetuning folder structure. Only dataroot_H is needed.
+    # -----------------------------------------
+    # dataroot_H holds every H image and, next to each one, a
+    # sub-folder named after the image (extension removed) that
+    # contains one or more L versions of that image.
+    # -----------------------------------------
+    # In the 'train' phase every (H, L) pair is repeated
+    # num_patches_per_image times and each item is a patch; in any
+    # other phase each item is the full image pair.
+    # -----------------------------------------
+    """
+
+    def __init__(self, opt):
+        """
+        Read the options and build the aligned H/L path lists.
+
+        opt is indexed with the keys 'n_channels',
+        'n_channels_datasetload', 'H_size', 'sigma', 'sigma_test',
+        'use_all_patches', 'num_patches_per_image',
+        'skip_natural_patches', 'dataroot_H' and 'phase'. A falsy
+        value for any of the tunables selects the default used below.
+        """
+        super(DatasetFFDNet, self).__init__()
+        self.opt = opt
+        self.n_channels = opt['n_channels'] or 3
+        self.n_channels_datasetload = opt['n_channels_datasetload'] or 3
+        self.patch_size = opt['H_size'] or 64
+        self.sigma = opt['sigma'] or [0, 75]
+        self.sigma_min, self.sigma_max = self.sigma[0], self.sigma[1]
+        self.sigma_test = opt['sigma_test'] or 0
+        self.use_all_patches = opt['use_all_patches'] or False
+        self.num_patches_per_image = opt['num_patches_per_image'] or 100
+        self.skip_natural_patches = opt['skip_natural_patches'] or False
+
+        # -------------------------------------
+        # Dataset path includes all H images and L-subfolders.
+        # Every H image has one L-subfolder associated, which
+        # contains one or more L representations of the H image.
+        # -------------------------------------
+        root = opt['dataroot_H']
+
+        # Only the regular files directly inside the root are H images.
+        # util.get_image_paths() is not used here because it walks the
+        # directory tree recursively and would also pick up the L images.
+        # The isfile() test must see the joined path: a bare name would be
+        # resolved against the current working directory instead of root.
+        # Sorting keeps the sample order reproducible (os.listdir order
+        # is arbitrary).
+        H_files = sorted(
+            name for name in os.listdir(root)
+            if os.path.isfile(os.path.join(root, name))
+        )
+
+        self.paths_H = []
+        self.paths_L = []
+
+        for H_file in H_files:
+            # The L-subfolder is named after the H image without extension
+            L_folder = os.path.join(root, os.path.splitext(H_file)[0])
+            H_path = os.path.join(root, H_file)
+            # One (H, L) pair per file in the subfolder: the H path is
+            # repeated so both lists stay index-aligned
+            for L_file in sorted(os.listdir(L_folder)):
+                self.paths_H.append(H_path)
+                self.paths_L.append(os.path.join(L_folder, L_file))
+
+        # Repeat every pair consecutively to get more than one patch per
+        # image; _patch_origin relies on this layout
+        if self.opt['phase'] == 'train':
+            repeats = self.num_patches_per_image
+            self.paths_H = [path for path in self.paths_H for _ in range(repeats)]
+            self.paths_L = [path for path in self.paths_L for _ in range(repeats)]
+
+    def _patch_origin(self, index, img_H):
+        """Return (h_index, w_index), the upper-left corner of the training patch."""
+        H, W = img_H.shape[:2]
+        size = self.patch_size
+        # Largest valid corner; 0 when the image is smaller than the patch
+        h_max = max(0, H - size)
+        w_max = max(0, W - size)
+
+        if not (self.use_all_patches or H <= size or W <= size):
+            # ---------------------------------
+            # randomly crop the patch
+            # ---------------------------------
+            h_index = random.randint(0, h_max)
+            w_index = random.randint(0, w_max)
+            return h_index, w_index
+
+        # ---------------------------------
+        # Start or continue image patching
+        # ---------------------------------
+        # Resets to 0 every time index overflows num_patches
+        img_patch_index = index % self.num_patches_per_image
+        offset = img_patch_index * size
+
+        # Upper-left corner of patch
+        h_index = size * (offset // W)
+        w_index = size * ((offset % W) // size)
+
+        # Dont exceed the image limit (and never go negative, which would
+        # silently slice from the opposite border)
+        h_index = min(h_index, h_max)
+        w_index = min(w_index, w_max)
+
+        ### Keep text patches only (non-natural images)
+        if self.skip_natural_patches:
+            # If the selected patch is natural, draw random patches until a
+            # non-natural one is found or the attempts run out
+            max_attempts = 10
+            attempt = 0
+            is_natural = is_natural_patch(img_H[h_index:h_index + size, w_index:w_index + size, :])
+            while is_natural and (attempt < max_attempts):
+                h_index = random.randint(0, h_max)
+                w_index = random.randint(0, w_max)
+                is_natural = is_natural_patch(img_H[h_index:h_index + size, w_index:w_index + size, :])
+                attempt += 1
+
+        return h_index, w_index
+
+    def __getitem__(self, index):
+        """
+        Load the index-th (H, L) pair.
+
+        Returns a dict with the L tensor ('L'), the H tensor ('H'), the
+        noise level reshaped to three dimensions ('C') and both file
+        paths ('L_path', 'H_path').
+        """
+        # -------------------------------------
+        # get H and L image
+        # -------------------------------------
+        H_path = self.paths_H[index]
+        L_path = self.paths_L[index]
+
+        # Names are compared up to the first '.'
+        H_name = os.path.basename(H_path).split('.')[0]
+        L_name = os.path.basename(L_path).split('.')[0]
+
+        # NOTE(review): this requires every L file to share its H image's
+        # name up to the first '.' -- confirm against the dataset layout.
+        assert H_name==L_name, f'Both high and low quality images MUST have same name.\nGot {H_name} and {L_name} respectively.'
+
+        img_H = util.imread_uint(H_path, self.n_channels_datasetload)
+
+        # Only the first two channels of the L image are used
+        img_L = util.imread_uint(L_path, self.n_channels_datasetload)[:, :, :2]
+
+        # Temp solution for blanking images: a 1000x1800 capture is
+        # cropped to its central 900x1600 region
+        if img_L.shape[:2] == (1000, 1800):
+            v_margin = (1000 - 900) // 2
+            h_margin = (1800 - 1600) // 2
+            img_L = img_L[v_margin:-v_margin, h_margin:-h_margin, :]
+
+        if self.opt['phase'] == 'train':
+            # --------------------------------
+            # get L/H patch pairs
+            # --------------------------------
+            h_index, w_index = self._patch_origin(index, img_H)
+            h_end = h_index + self.patch_size
+            w_end = w_index + self.patch_size
+
+            # Ground-truth as channels mean
+            patch_H = np.mean(img_H[h_index:h_end, w_index:w_end, :], axis=2)
+
+            # Get the patch from the simulation
+            patch_L = img_L[h_index:h_end, w_index:w_end, :]
+
+            # ---------------------------------
+            # HWC to CHW, numpy(uint) to tensor
+            # ---------------------------------
+            img_H = util.uint2tensor3(patch_H)
+            img_L = util.uint2tensor3(patch_L)
+
+            # ---------------------------------
+            # get noise level
+            # ---------------------------------
+            noise_level = torch.FloatTensor([int(np.random.uniform(self.sigma_min, self.sigma_max))])/255.0
+            add_noise = self.sigma_max != 0
+
+        else:
+            # --------------------------------
+            # get L/H/sigma image pairs
+            # --------------------------------
+
+            # Ground-truth as mean value of RGB channels
+            img_H = np.mean(img_H, axis=2)[:, :, np.newaxis]
+
+            # ---------------------------------
+            # HWC to CHW, numpy(uint) to tensor
+            # ---------------------------------
+            img_H = util.uint2tensor3(img_H)
+            img_L = util.uint2tensor3(img_L)
+
+            # ---------------------------------
+            # get noise level
+            # ---------------------------------
+            noise_level = torch.FloatTensor([int(self.sigma_test)])/255.0
+            add_noise = self.sigma_test != 0
+
+        if add_noise:
+            # ---------------------------------
+            # add noise
+            # ---------------------------------
+            noise = torch.randn(img_L.size()).mul_(noise_level).float()
+            img_L.add_(noise)
+
+        noise_level = noise_level.unsqueeze(1).unsqueeze(1)
+
+        return {'L': img_L, 'H': img_H, 'C': noise_level, 'L_path': L_path, 'H_path': H_path}
+
+    def __len__(self):
+        """Number of (H, L) entries, patch repetitions included."""
+        return len(self.paths_H)