LCAV · ebezzam · Aug 29, 2023 · Jul 20, 2023 · Jul 20, 2023 · Jul 20, 2023
diff --git a/CHANGELOG.rst b/CHANGELOG.rst
@@ -22,6 +22,9 @@ Added
 - Script for measuring arbitrary dataset (from Raspberry Pi).
 - Support for preprocessing and postprocessing, such as denoising, in ``TrainableReconstructionAlgorithm``. Both trainable and fix postprocessing can be used.
 - Utilities to load a trained DruNet model for use as postprocessing in ``TrainableReconstructionAlgorithm``.
+- Unified interface for dataset. See ``utils.dataset.DualDataset``.
+- New simulated dataset compatible with new data format ([(batch_size), depth, width, height, color]). See ``utils.dataset.SimulatedFarFieldDataset``.
+- New dataset for pairs of original images and their measurements from a screen. See ``utils.dataset.LenslessDataset``.
 - Support for unrolled loading and inference in the script ``admm.py``.
 - Tikhonov reconstruction for coded aperture measurements (MLS / MURA).
 

diff --git a/docs/requirements.txt b/docs/requirements.txt
@@ -4,4 +4,5 @@ docutils==0.16     # >0.17 doesn't render bullets
 numpy>=1.22      # so that default dtype are correctly rendered
 torch>=1.10
 torchvision>=0.15.2
-torchmetrics>=0.11.4
+torchmetrics>=0.11.4
+waveprop>=0.0.5
diff --git a/docs/source/conf.py b/docs/source/conf.py
@@ -28,14 +28,14 @@
     "pycsou.util",
     "pycsou.util.ptype",
     "PIL",
+    "PIL.Image",
     "tqdm",
     "paramiko",
     "paramiko.ssh_exception",
     "perlin_numpy",
-    "waveprop",
-    "waveprop.fresnel",
-    "waveprop.rs",
-    "waveprop.noise",
+    "scipy.special",
+    "matplotlib.cm",
+    "pyffs",
 ]
 for mod_name in MOCK_MODULES:
     sys.modules[mod_name] = mock.Mock()

diff --git a/docs/source/dataset.rst b/docs/source/dataset.rst
@@ -0,0 +1,23 @@
+Dataset objects (for training and testing)
+==========================================
+
+The software below provides functionality (with PyTorch) to load
+datasets for training and testing.
+
+.. automodule:: lensless.utils.dataset
+
+.. autoclass:: lensless.utils.dataset.DualDataset
+    :members: _get_images_pair
+    :special-members: __init__, __len__
+
+.. autoclass:: lensless.utils.dataset.LenslessDataset
+    :members:
+    :special-members: __init__
+
+.. autoclass:: lensless.utils.dataset.SimulatedFarFieldDataset
+    :members:
+    :special-members: __init__
+
+.. autoclass:: lensless.utils.dataset.DiffuserCamTestDataset
+    :members:
+    :special-members: __init__
diff --git a/docs/source/evaluation.rst b/docs/source/evaluation.rst
@@ -23,8 +23,4 @@
 
    .. automodule:: lensless.eval.benchmark
 
-   .. autoclass:: lensless.eval.benchmark.ParallelDataset
-      :members:
-      :special-members: __init__
-
    .. autofunction:: lensless.eval.benchmark.benchmark
diff --git a/docs/source/index.rst b/docs/source/index.rst
@@ -35,6 +35,7 @@ Contents
 
    simulation
    data
+   dataset
 
 .. toctree::
    :hidden:

diff --git a/docs/source/simulation.rst b/docs/source/simulation.rst
@@ -16,6 +16,18 @@ library is used with the following simulation steps:
 
 PyTorch support is available to speed up simulation on GPU, and to create Dataset and DataLoader objects for training and testing!
 
+FarFieldSimulator
+------------------
+
+A wrapper around `waveprop.simulation.FarFieldSimulator <https://github.com/ebezzam/waveprop/blob/82dfb08b4db11c0c07ef00bdb59b5a769a49f0b3/waveprop/simulation.py#L11C11-L11C11>`__
+is implemented as :py:class:`lensless.utils.simulation.FarFieldSimulator`.
+It handles the conversion between the HWC and CHW dimension orderings so that the convention of LenslessPiCam can be maintained (namely HWC).
+
+.. autoclass:: lensless.utils.simulation.FarFieldSimulator
+    :members:
+    :special-members: __init__
+
+
 Simulating 3D data
 ------------------
 

diff --git a/lensless/eval/benchmark.py b/lensless/eval/benchmark.py
@@ -7,18 +7,14 @@
 # #############################################################################
 
 
-import glob
-import os
-from lensless.utils.io import load_psf
-from lensless.utils.image import resize
-import numpy as np
+from lensless.utils.dataset import DiffuserCamTestDataset
 from tqdm import tqdm
 
 from lensless.utils.io import load_image
 
 try:
     import torch
-    from torch.utils.data import Dataset, DataLoader
+    from torch.utils.data import DataLoader
     from torch.nn import MSELoss, L1Loss
     from torchmetrics import StructuralSimilarityIndexMeasure
     from torchmetrics.image import lpip, psnr
@@ -28,207 +24,6 @@
     )
 
 
-class ParallelDataset(Dataset):
-    """
-    Dataset consisting of lensless and corresponding lensed image.
-
-    It can be used with a PyTorch DataLoader to load a batch of lensless and corresponding lensed images.
-
-    """
-
-    def __init__(
-        self,
-        root_dir,
-        n_files=False,
-        background=None,
-        downsample=4,
-        flip=False,
-        transform_lensless=None,
-        transform_lensed=None,
-        lensless_fn="diffuser",
-        lensed_fn="lensed",
-        image_ext="npy",
-        **kwargs,
-    ):
-        """
-        Dataset consisting of lensless and corresponding lensed image. Default parameters are for the DiffuserCam
-        Lensless Mirflickr Dataset (DLMD).
-
-        Parameters
-        ----------
-
-            root_dir : str
-                Path to the test dataset. It is expected to contain two folders: ones of lensless images and one of lensed images.
-            n_files : int or None, optional
-                Metrics will be computed only on the first ``n_files`` images. If None, all images are used, by default False
-            background : :py:class:`~torch.Tensor` or None, optional
-                If not ``None``, background is removed from lensless images, by default ``None``.
-            downsample : int, optional
-                Downsample factor of the lensless images, by default 4.
-            flip : bool, optional
-                If ``True``, lensless images are flipped, by default ``False``.
-            transform_lensless : PyTorch Transform or None, optional
-                Transform to apply to the lensless images, by default None
-            transform_lensed : PyTorch Transform or None, optional
-                Transform to apply to the lensed images, by default None
-            lensless_fn : str, optional
-                Name of the folder containing the lensless images, by default "diffuser".
-            lensed_fn : str, optional
-                Name of the folder containing the lensed images, by default "lensed".
-            image_ext : str, optional
-                Extension of the images, by default "npy".
-        """
-
-        self.root_dir = root_dir
-        self.lensless_dir = os.path.join(root_dir, lensless_fn)
-        self.lensed_dir = os.path.join(root_dir, lensed_fn)
-        self.image_ext = image_ext.lower()
-
-        files = glob.glob(os.path.join(self.lensless_dir, "*." + image_ext))
-        if n_files:
-            files = files[:n_files]
-        self.files = [os.path.basename(fn) for fn in files]
-
-        if len(self.files) == 0:
-            raise FileNotFoundError(
-                f"No files found in {self.lensless_dir} with extension {image_ext}"
-            )
-
-        self.background = background
-        self.downsample = downsample / 4
-        self.flip = flip
-        self.transform_lensless = transform_lensless
-        self.transform_lensed = transform_lensed
-
-    def __len__(self):
-        return len(self.files)
-
-    def __getitem__(self, idx):
-        if torch.is_tensor(idx):
-            idx = idx.tolist()
-
-        if self.image_ext == "npy":
-            lensless_fp = os.path.join(self.lensless_dir, self.files[idx])
-            lensed_fp = os.path.join(self.lensed_dir, self.files[idx])
-            lensless = np.load(lensless_fp)
-            lensed = np.load(lensed_fp)
-        else:
-            # more standard image formats: png, jpg, tiff, etc.
-            lensless_fp = os.path.join(self.lensless_dir, self.files[idx])
-            lensed_fp = os.path.join(self.lensed_dir, self.files[idx])
-            lensless = load_image(lensless_fp)
-            lensed = load_image(lensed_fp)
-
-            # convert to float
-            if lensless.dtype == np.uint8:
-                lensless = lensless.astype(np.float32) / 255
-                lensed = lensed.astype(np.float32) / 255
-            else:
-                # 16 bit
-                lensless = lensless.astype(np.float32) / 65535
-                lensed = lensed.astype(np.float32) / 65535
-
-        if self.downsample != 1.0:
-            lensless = resize(lensless, factor=1 / self.downsample)
-            lensed = resize(lensed, factor=1 / self.downsample)
-
-        lensless = torch.from_numpy(lensless)
-        lensed = torch.from_numpy(lensed)
-
-        # If [H, W, C] -> [D, H, W, C]
-        if len(lensless.shape) == 3:
-            lensless = lensless.unsqueeze(0)
-        if len(lensed.shape) == 3:
-            lensed = lensed.unsqueeze(0)
-
-        if self.background is not None:
-            lensless = lensless - self.background
-
-        # flip image x and y if needed
-        if self.flip:
-            lensless = torch.rot90(lensless, dims=(-3, -2))
-            lensed = torch.rot90(lensed, dims=(-3, -2))
-        if self.transform_lensless:
-            lensless = self.transform_lensless(lensless)
-
-        if self.transform_lensed:
-            lensed = self.transform_lensed(lensed)
-
-        return lensless, lensed
-
-
-class DiffuserCamTestDataset(ParallelDataset):
-    """
-    Dataset consisting of lensless and corresponding lensed image. This is the standard dataset used for benchmarking.
-    """
-
-    def __init__(
-        self,
-        data_dir="data",
-        n_files=200,
-        downsample=8,
-    ):
-        """
-        Dataset consisting of lensless and corresponding lensed image. Default parameters are for the test set of DiffuserCam
-        Lensless Mirflickr Dataset (DLMD).
-
-        Parameters
-        ----------
-        data_dir : str, optional
-            The path to the folder containing the DiffuserCam_Test dataset, by default "data"
-        n_files : int, optional
-            Number of image pair to load in the dataset , by default 200
-        downsample : int, optional
-            Downsample factor of the lensless images, by default 8
-        """
-        # download dataset if necessary
-        main_dir = data_dir
-        data_dir = os.path.join(data_dir, "DiffuserCam_Test")
-        if not os.path.isdir(data_dir):
-            print("No dataset found for benchmarking.")
-            try:
-                from torchvision.datasets.utils import download_and_extract_archive
-            except ImportError:
-                exit()
-            msg = "Do you want to download the sample dataset (3.5GB)?"
-
-            # default to yes if no input is given
-            valid = input("%s (Y/n) " % msg).lower() != "n"
-            if valid:
-                url = "https://drive.switch.ch/index.php/s/D3eRJ6PRljfHoH8/download"
-                filename = "DiffuserCam_Test.zip"
-                download_and_extract_archive(url, main_dir, filename=filename, remove_finished=True)
-
-        psf_fp = os.path.join(data_dir, "psf.tiff")
-        psf, background = load_psf(
-            psf_fp,
-            downsample=downsample,
-            return_float=True,
-            return_bg=True,
-            bg_pix=(0, 15),
-        )
-
-        # transform from BGR to RGB
-        from torchvision import transforms
-
-        transform_BRG2RGB = transforms.Lambda(lambda x: x[..., [2, 1, 0]])
-
-        self.psf = transform_BRG2RGB(torch.from_numpy(psf))
-
-        super().__init__(
-            data_dir,
-            n_files,
-            background,
-            downsample,
-            flip=False,
-            transform_lensless=transform_BRG2RGB,
-            transform_lensed=transform_BRG2RGB,
-            lensless_fn="diffuser",
-            lensed_fn="lensed",
-            image_ext="npy",
-        )
-
-
 def benchmark(model, dataset, batchsize=1, metrics=None, **kwargs):
     """
     Compute multiple metrics for a reconstruction algorithm.

diff --git a/lensless/hardware/mask.py b/lensless/hardware/mask.py
@@ -25,8 +25,8 @@
 from perlin_numpy import generate_perlin_noise_2d
 from sympy.ntheory import quadratic_residues
 from scipy.signal import max_len_seq
-from scipy.linalg import circulant
-from numpy.linalg import multi_dot
+from scipy.linalg import circulant
+from numpy.linalg import multi_dot
 from waveprop.fresnel import fresnel_conv
 from waveprop.rs import angular_spectrum
 from waveprop.noise import add_shot_noise