deep-tempest/end-to-end/data/dataset_ffdnet.py

import random
import numpy as np
import torch
import torch.utils.data as data
import utils.utils_image as util
from utils.DTutils import is_natural_patch
import itertools


class DatasetFFDNet(data.Dataset):
    """
    # -----------------------------------------
    # Get L/H/M for denosing on AWGN with a range of sigma.
    # Only dataroot_H is needed.
    # -----------------------------------------
    # e.g., FFDNet, H = f(L, sigma), sigma is noise level
    # -----------------------------------------
    """

    def __init__(self, opt):
        super(DatasetFFDNet, self).__init__()
        self.opt = opt
        self.n_channels = opt['n_channels'] if opt['n_channels'] else 3
        self.n_channels_datasetload = opt['n_channels_datasetload'] if opt['n_channels_datasetload'] else 3
        self.patch_size = self.opt['H_size'] if opt['H_size'] else 64
        self.sigma = opt['sigma'] if opt['sigma'] else [0, 75]
        self.sigma_min, self.sigma_max = self.sigma[0], self.sigma[1]
        self.sigma_test = opt['sigma_test'] if opt['sigma_test']  else 0
        self.use_all_patches = opt['use_all_patches'] if opt['use_all_patches'] else False
        self.num_patches_per_image = opt['num_patches_per_image'] if opt['num_patches_per_image'] else 100
        # self.num_patches_per_image = opt['num_patches_per_image'] if not(self.use_all_patches) else ((1280**2)//(self.patch_size)**2)    ### HARDCODED
        self.skip_natural_patches = opt['skip_natural_patches'] if opt['skip_natural_patches'] else False

        # -------------------------------------
        # get the path of H, return None if input is None
        # -------------------------------------
        self.paths_H = util.get_image_paths(opt['dataroot_H'])
        self.paths_L = util.get_image_paths(opt['dataroot_L'])

        # Repeat every image in path list to get more than one patch per image
        if self.opt['phase'] == 'train':
            listOfLists = [list(itertools.repeat(path, self.num_patches_per_image)) for path in self.paths_H]
            self.paths_H = list(itertools.chain.from_iterable(listOfLists))

            listOfLists = [list(itertools.repeat(path, self.num_patches_per_image)) for path in self.paths_L]
            self.paths_L = list(itertools.chain.from_iterable(listOfLists))

    def __getitem__(self, index):

        # -------------------------------------
        # get H and L image
        # -------------------------------------
        H_path = self.paths_H[index]
        L_path = self.paths_L[index]

        H_file, L_file = H_path.split('/')[-1], L_path.split('/')[-1]
        H_name, L_name = H_file.split('.')[0], L_file.split('.')[0]
        
        assert H_name==L_name, f'Both high and low quality images MUST have same name.\nGot {H_name} and {L_name} respectively.'

        img_H = util.imread_uint(H_path, self.n_channels_datasetload)       

        
        img_L = util.imread_uint(L_path, self.n_channels_datasetload)[:,:,:2]       

        # Temp solution for blanking images
        L_v, L_h = img_L.shape[:2]

        if L_v==1000 and L_h==1800:
          img_L  = img_L[(1000-900)//2:-(1000-900)//2,(1800-1600)//2:-(1800-1600)//2,:]

        # Get module of complex image, stretch and to uint8
        # img_L = img_L.astype('float')
        # img_L = np.abs(img_L[:,:,0]+1j*img_L[:,:,1])
        # img_L = 255*(img_L - img_L.min())/(img_L.max() - img_L.min())
        # img_L = img_L.astype('uint8')

        if self.opt['phase'] == 'train':
            """
            # --------------------------------
            # get L/H/M patch pairs
            # --------------------------------
            """
            H, W = img_H.shape[:2]

            if self.use_all_patches or (img_H.shape[0] <= self.patch_size) or (img_H.shape[1] <= self.patch_size):

                # ---------------------------------
                # Start or continue image patching
                # ---------------------------------                
                img_patch_index = index % self.num_patches_per_image  # Resets to 0 every time index overflows num_patches
                
                # Upper-left corner of patch
                h_index = self.patch_size * ( (img_patch_index * self.patch_size) // W)
                w_index =  self.patch_size * ( ( (img_patch_index * self.patch_size) % W ) // self.patch_size)

                # Dont exceed the image limit
                h_index = min(h_index, H - self.patch_size)
                w_index = min(w_index, W - self.patch_size)

                ### Keep text patches only (non-natural images)
                if self.skip_natural_patches:

                    # Check if selected patch is natural, based on RGB entropy
                    is_natural = is_natural_patch(img_H[h_index:h_index + self.patch_size, w_index:w_index + self.patch_size, :])

                    # If natural, select random patch and keep trying until non-natural or reaching max attempts
                    attempt = 0
                    max_attempts = 10
                    while is_natural and (attempt < max_attempts):
                        h_index = random.randint(0, max(0, H - self.patch_size))
                        w_index = random.randint(0, max(0, W - self.patch_size))
                        is_natural = is_natural_patch(img_H[h_index:h_index + self.patch_size, w_index:w_index + self.patch_size, :])
                        attempt += 1


            else:
                # ---------------------------------
                # randomly crop the patch
                # ---------------------------------
                h_index = random.randint(0, max(0, H - self.patch_size))
                w_index = random.randint(0, max(0, W - self.patch_size))

            # Ground-truth as channels mean
            patch_H = np.mean(img_H[h_index:h_index + self.patch_size, w_index:w_index + self.patch_size, :],axis=2)
            
            # Get the patch from the simulation
            patch_L = img_L[h_index:h_index + self.patch_size, w_index:w_index + self.patch_size,:]

            # ---------------------------------
            # HWC to CHW, numpy(uint) to tensor
            # ---------------------------------
            img_H = util.uint2tensor3(patch_H)
            img_L = util.uint2tensor3(patch_L)

            # ---------------------------------
            # get noise level
            # ---------------------------------
            noise_level = torch.FloatTensor([int(np.random.uniform(self.sigma_min, self.sigma_max))])/255.0
            # noise_level = torch.FloatTensor([np.random.randint(self.sigma_min, self.sigma_max)])/255.0
            if (self.sigma_max != 0):
                # ---------------------------------
                # add noise
                # ---------------------------------
                noise = torch.randn(img_L.size()).mul_(noise_level).float()
                img_L.add_(noise)

        else:
            """
            # --------------------------------
            # get L/H/sigma image pairs
            # --------------------------------
            """

            # Ground-truth as mean value of RGB channels
            img_H = np.mean(img_H,axis=2)
            img_H = img_H[:,:,np.newaxis]

            # ---------------------------------
            # HWC to CHW, numpy(uint) to tensor
            # ---------------------------------
            img_H = util.uint2tensor3(img_H)
            img_L = util.uint2tensor3(img_L)

            # img_H = util.uint2single(img_H)

            # img_L = util.uint2single(img_L)

            
            # ---------------------------------
            # get noise level
            # ---------------------------------

            noise_level = torch.FloatTensor([int(self.sigma_test)])/255.0
            if self.sigma_test != 0:

                # noise_level = torch.FloatTensor([np.random.randint(self.sigma_min, self.sigma_max)])/255.0
            
                # ---------------------------------
                # add noise
                # ---------------------------------
                noise = torch.randn(img_L.size()).mul_(noise_level).float()
                img_L.add_(noise)


        noise_level = noise_level.unsqueeze(1).unsqueeze(1)


        return {'L': img_L, 'H': img_H, 'C': noise_level, 'L_path': L_path, 'H_path': H_path}

    def __len__(self):
        return len(self.paths_H)
Added KAIR and gitignore 2023-03-18 16:11:22 -07:00			`import random`
			`import numpy as np`
			`import torch`
			`import torch.utils.data as data`
			`import utils.utils_image as util`
Add skip natural patches functionalities 2023-05-13 11:20:54 -07:00			`from utils.DTutils import is_natural_patch`
Added multiple patches per image for training (specifying num patches at train.json) 2023-03-29 13:05:44 -07:00			`import itertools`
Added KAIR and gitignore 2023-03-18 16:11:22 -07:00

			`class DatasetFFDNet(data.Dataset):`
			`"""`
			`# -----------------------------------------`
			`# Get L/H/M for denosing on AWGN with a range of sigma.`
			`# Only dataroot_H is needed.`
			`# -----------------------------------------`
			`# e.g., FFDNet, H = f(L, sigma), sigma is noise level`
			`# -----------------------------------------`
			`"""`

			`def __init__(self, opt):`
			`super(DatasetFFDNet, self).__init__()`
			`self.opt = opt`
			`self.n_channels = opt['n_channels'] if opt['n_channels'] else 3`
Fix: simulation for training dataset 2023-03-26 08:18:46 -07:00			`self.n_channels_datasetload = opt['n_channels_datasetload'] if opt['n_channels_datasetload'] else 3`
Added KAIR and gitignore 2023-03-18 16:11:22 -07:00			`self.patch_size = self.opt['H_size'] if opt['H_size'] else 64`
			`self.sigma = opt['sigma'] if opt['sigma'] else [0, 75]`
			`self.sigma_min, self.sigma_max = self.sigma[0], self.sigma[1]`
Changes for better training logs an visuals 2023-06-19 19:32:14 -07:00			`self.sigma_test = opt['sigma_test'] if opt['sigma_test'] else 0`
Added support for all patches in image training 2023-04-17 18:06:48 -07:00			`self.use_all_patches = opt['use_all_patches'] if opt['use_all_patches'] else False`
Changes for better training logs an visuals 2023-06-19 19:32:14 -07:00			`self.num_patches_per_image = opt['num_patches_per_image'] if opt['num_patches_per_image'] else 100`
			`# self.num_patches_per_image = opt['num_patches_per_image'] if not(self.use_all_patches) else ((12802)//(self.patch_size)2) ### HARDCODED`
Add skip natural patches functionalities 2023-05-13 11:20:54 -07:00			`self.skip_natural_patches = opt['skip_natural_patches'] if opt['skip_natural_patches'] else False`
Added KAIR and gitignore 2023-03-18 16:11:22 -07:00
			`# -------------------------------------`
			`# get the path of H, return None if input is None`
			`# -------------------------------------`
Add skip natural patches functionalities 2023-05-13 11:20:54 -07:00			`self.paths_H = util.get_image_paths(opt['dataroot_H'])`
			`self.paths_L = util.get_image_paths(opt['dataroot_L'])`

Fix: simulated image stretch now before cropping 2023-04-02 16:02:12 -07:00			`# Repeat every image in path list to get more than one patch per image`
Added multiple patches per image for training (specifying num patches at train.json) 2023-03-29 13:05:44 -07:00			`if self.opt['phase'] == 'train':`
			`listOfLists = [list(itertools.repeat(path, self.num_patches_per_image)) for path in self.paths_H]`
			`self.paths_H = list(itertools.chain.from_iterable(listOfLists))`

			`listOfLists = [list(itertools.repeat(path, self.num_patches_per_image)) for path in self.paths_L]`
			`self.paths_L = list(itertools.chain.from_iterable(listOfLists))`
Added KAIR and gitignore 2023-03-18 16:11:22 -07:00
			`def __getitem__(self, index):`
Modified dataset for drunet (loading both GT and simulations) 2023-03-27 09:07:44 -07:00
Added KAIR and gitignore 2023-03-18 16:11:22 -07:00			`# -------------------------------------`
Modified dataset for drunet (loading both GT and simulations) 2023-03-27 09:07:44 -07:00			`# get H and L image`
Added KAIR and gitignore 2023-03-18 16:11:22 -07:00			`# -------------------------------------`
			`H_path = self.paths_H[index]`
Modified dataset for drunet (loading both GT and simulations) 2023-03-27 09:07:44 -07:00			`L_path = self.paths_L[index]`

			`H_file, L_file = H_path.split('/')[-1], L_path.split('/')[-1]`
			`H_name, L_name = H_file.split('.')[0], L_file.split('.')[0]`

Fix: dataset names error handling 2023-06-26 19:54:22 -07:00			`assert H_name==L_name, f'Both high and low quality images MUST have same name.\nGot {H_name} and {L_name} respectively.'`
Modified dataset for drunet (loading both GT and simulations) 2023-03-27 09:07:44 -07:00
			`img_H = util.imread_uint(H_path, self.n_channels_datasetload)`
Added KAIR and gitignore 2023-03-18 16:11:22 -07:00
Modified dataset for drunet (loading both GT and simulations) 2023-03-27 09:07:44 -07:00
			`img_L = util.imread_uint(L_path, self.n_channels_datasetload)[:,:,:2]`
Added KAIR and gitignore 2023-03-18 16:11:22 -07:00
Changes for better training logs an visuals 2023-06-19 19:32:14 -07:00			`# Temp solution for blanking images`
			`L_v, L_h = img_L.shape[:2]`

			`if L_v==1000 and L_h==1800:`
			`img_L = img_L[(1000-900)//2:-(1000-900)//2,(1800-1600)//2:-(1800-1600)//2,:]`

Fix: simulated image stretch now before cropping 2023-04-02 16:02:12 -07:00			`# Get module of complex image, stretch and to uint8`
Test scripts for both DnCNN and DRUNet for tempest 2023-04-06 15:31:46 -07:00			`# img_L = img_L.astype('float')`
			`# img_L = np.abs(img_L[:,:,0]+1j*img_L[:,:,1])`
			`# img_L = 255*(img_L - img_L.min())/(img_L.max() - img_L.min())`
			`# img_L = img_L.astype('uint8')`
Fix: simulated image stretch now before cropping 2023-04-02 16:02:12 -07:00
Added KAIR and gitignore 2023-03-18 16:11:22 -07:00			`if self.opt['phase'] == 'train':`
			`"""`
			`# --------------------------------`
			`# get L/H/M patch pairs`
			`# --------------------------------`
			`"""`
			`H, W = img_H.shape[:2]`
Changes for better training logs an visuals 2023-06-19 19:32:14 -07:00
			`if self.use_all_patches or (img_H.shape[0] <= self.patch_size) or (img_H.shape[1] <= self.patch_size):`
Added support for all patches in image training 2023-04-17 18:06:48 -07:00
			`# ---------------------------------`
			`# Start or continue image patching`
			`# ---------------------------------`
			`img_patch_index = index % self.num_patches_per_image # Resets to 0 every time index overflows num_patches`
FIX: patches now are properly selected 2023-04-19 16:45:11 -07:00
			`# Upper-left corner of patch`
			`h_index = self.patch_size * ( (img_patch_index * self.patch_size) // W)`
			`w_index = self.patch_size * ( ( (img_patch_index * self.patch_size) % W ) // self.patch_size)`

			`# Dont exceed the image limit`
			`h_index = min(h_index, H - self.patch_size)`
			`w_index = min(w_index, W - self.patch_size)`
Added support for all patches in image training 2023-04-17 18:06:48 -07:00
Add skip natural patches functionalities 2023-05-13 11:20:54 -07:00			`### Keep text patches only (non-natural images)`
			`if self.skip_natural_patches:`

			`# Check if selected patch is natural, based on RGB entropy`
			`is_natural = is_natural_patch(img_H[h_index:h_index + self.patch_size, w_index:w_index + self.patch_size, :])`

			`# If natural, select random patch and keep trying until non-natural or reaching max attempts`
			`attempt = 0`
			`max_attempts = 10`
			`while is_natural and (attempt < max_attempts):`
			`h_index = random.randint(0, max(0, H - self.patch_size))`
			`w_index = random.randint(0, max(0, W - self.patch_size))`
			`is_natural = is_natural_patch(img_H[h_index:h_index + self.patch_size, w_index:w_index + self.patch_size, :])`
			`attempt += 1`


Added support for all patches in image training 2023-04-17 18:06:48 -07:00			`else:`
			`# ---------------------------------`
			`# randomly crop the patch`
			`# ---------------------------------`
FIX: patches now are properly selected 2023-04-19 16:45:11 -07:00			`h_index = random.randint(0, max(0, H - self.patch_size))`
			`w_index = random.randint(0, max(0, W - self.patch_size))`
WIP: added simulation scripts (GNURadio3.8) and modifying drunet training pre-processing 2023-03-20 19:00:33 -07:00
			`# Ground-truth as channels mean`
FIX: patches now are properly selected 2023-04-19 16:45:11 -07:00			`patch_H = np.mean(img_H[h_index:h_index + self.patch_size, w_index:w_index + self.patch_size, :],axis=2)`
Fix: simulation for training dataset 2023-03-26 08:18:46 -07:00
WIP: adding support to train tempest attack data 2023-03-23 19:27:58 -07:00			`# Get the patch from the simulation`
FIX: patches now are properly selected 2023-04-19 16:45:11 -07:00			`patch_L = img_L[h_index:h_index + self.patch_size, w_index:w_index + self.patch_size,:]`
Added KAIR and gitignore 2023-03-18 16:11:22 -07:00
			`# ---------------------------------`
			`# HWC to CHW, numpy(uint) to tensor`
			`# ---------------------------------`
			`img_H = util.uint2tensor3(patch_H)`
WIP: added simulation scripts (GNURadio3.8) and modifying drunet training pre-processing 2023-03-20 19:00:33 -07:00			`img_L = util.uint2tensor3(patch_L)`
Added KAIR and gitignore 2023-03-18 16:11:22 -07:00
			`# ---------------------------------`
			`# get noise level`
			`# ---------------------------------`
Changes for better training logs an visuals 2023-06-19 19:32:14 -07:00			`noise_level = torch.FloatTensor([int(np.random.uniform(self.sigma_min, self.sigma_max))])/255.0`
Added KAIR and gitignore 2023-03-18 16:11:22 -07:00			`# noise_level = torch.FloatTensor([np.random.randint(self.sigma_min, self.sigma_max)])/255.0`
Changes for better training logs an visuals 2023-06-19 19:32:14 -07:00			`if (self.sigma_max != 0):`
			`# ---------------------------------`
			`# add noise`
			`# ---------------------------------`
			`noise = torch.randn(img_L.size()).mul_(noise_level).float()`
			`img_L.add_(noise)`
Added KAIR and gitignore 2023-03-18 16:11:22 -07:00
			`else:`
			`"""`
			`# --------------------------------`
			`# get L/H/sigma image pairs`
			`# --------------------------------`
			`"""`
WIP: adding support to train tempest attack data 2023-03-23 19:27:58 -07:00
			`# Ground-truth as mean value of RGB channels`
			`img_H = np.mean(img_H,axis=2)`
Modified dataset for drunet (loading both GT and simulations) 2023-03-27 09:07:44 -07:00			`img_H = img_H[:,:,np.newaxis]`
WIP: adding support to train tempest attack data 2023-03-23 19:27:58 -07:00
Changes for better training logs an visuals 2023-06-19 19:32:14 -07:00			`# ---------------------------------`
			`# HWC to CHW, numpy(uint) to tensor`
			`# ---------------------------------`
			`img_H = util.uint2tensor3(img_H)`
			`img_L = util.uint2tensor3(img_L)`

			`# img_H = util.uint2single(img_H)`
Training settings for abs value tempest 2023-03-29 15:33:45 -07:00
Changes for better training logs an visuals 2023-06-19 19:32:14 -07:00			`# img_L = util.uint2single(img_L)`
Added KAIR and gitignore 2023-03-18 16:11:22 -07:00
Changes for better training logs an visuals 2023-06-19 19:32:14 -07:00
Added KAIR and gitignore 2023-03-18 16:11:22 -07:00			`# ---------------------------------`
Changes for better training logs an visuals 2023-06-19 19:32:14 -07:00			`# get noise level`
Added KAIR and gitignore 2023-03-18 16:11:22 -07:00			`# ---------------------------------`
Changes for better training logs an visuals 2023-06-19 19:32:14 -07:00
			`noise_level = torch.FloatTensor([int(self.sigma_test)])/255.0`
			`if self.sigma_test != 0:`

			`# noise_level = torch.FloatTensor([np.random.randint(self.sigma_min, self.sigma_max)])/255.0`

			`# ---------------------------------`
			`# add noise`
			`# ---------------------------------`
			`noise = torch.randn(img_L.size()).mul_(noise_level).float()`
			`img_L.add_(noise)`


Added KAIR and gitignore 2023-03-18 16:11:22 -07:00
			`noise_level = noise_level.unsqueeze(1).unsqueeze(1)`


			`return {'L': img_L, 'H': img_H, 'C': noise_level, 'L_path': L_path, 'H_path': H_path}`

			`def __len__(self):`
			`return len(self.paths_H)`