Adds LPRec memory estimation and a test #348

Open · wants to merge 1 commit into base: main
@@ -120,6 +120,15 @@ recon:
    - datasets: [tomo]
    - multipliers: [None]
    - methods: [module]
  LPRec:
    pattern: sinogram
    output_dims_change: True
    implementation: gpu_cupy
    save_result_default: True
    memory_gpu:
      - datasets: [tomo]
      - multipliers: [None]
      - methods: [module]
  SIRT:
    pattern: sinogram
    output_dims_change: True
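For context, the memory_gpu entry with methods: [module] appears to tell httomo to delegate the GPU memory estimate to a supporting function named after the method; this PR adds _calc_memory_bytes_LPRec and _calc_output_dim_LPRec following that convention (see the next file). A minimal, hypothetical sketch of such a name-based lookup, not httomo's actual code:

# Hypothetical sketch only; httomo's real resolution logic may differ.
def lookup_memory_estimator(supporting_module, method_name: str):
    # Resolve the _calc_memory_bytes_<Method> naming convention used in this PR.
    return getattr(supporting_module, f"_calc_memory_bytes_{method_name}")

# e.g. lookup_memory_estimator(algorithm_supporting_funcs, "LPRec") -> _calc_memory_bytes_LPRec
# (algorithm_supporting_funcs is a placeholder for the module that defines these functions)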
@@ -27,9 +27,11 @@

__all__ = [
    "_calc_memory_bytes_FBP",
    "_calc_memory_bytes_LPRec",
    "_calc_memory_bytes_SIRT",
    "_calc_memory_bytes_CGLS",
    "_calc_output_dim_FBP",
    "_calc_output_dim_LPRec",
    "_calc_output_dim_SIRT",
    "_calc_output_dim_CGLS",
]
@@ -53,6 +55,10 @@ def _calc_output_dim_FBP(non_slice_dims_shape, **kwargs):
    return __calc_output_dim_recon(non_slice_dims_shape, **kwargs)


def _calc_output_dim_LPRec(non_slice_dims_shape, **kwargs):
    return __calc_output_dim_recon(non_slice_dims_shape, **kwargs)


def _calc_output_dim_SIRT(non_slice_dims_shape, **kwargs):
    return __calc_output_dim_recon(non_slice_dims_shape, **kwargs)

@@ -82,11 +88,82 @@ def _calc_memory_bytes_FBP(
    astra_out_size = np.prod(output_dims) * np.float32().itemsize

    tot_memory_bytes = int(
-       2 * in_slice_size
+       3 * in_slice_size
        + filtered_in_data
        + freq_slice
        + fftplan_size
-       + 3.5 * astra_out_size
+       + astra_out_size
    )
    return (tot_memory_bytes, filter_size)
Comment on lines +91 to +97
Collaborator:
On ws448, on the fourier branch, two FBP memory hook tests now fail for me:

(/dls/science/users/twi18192/conda-envs/httomo) [twi18192@ws448 httomo (fourier)]$ python -m pytest tests/test_backends/test_httomolibgpu.py::test_recon_FBP_memoryhook
========================================== test session starts ===========================================
platform linux -- Python 3.10.10, pytest-7.1.2, pluggy-1.3.0 -- /dls/science/users/twi18192/conda-envs/httomo/bin/python
cachedir: .pytest_cache
benchmark: 4.0.0 (defaults: timer=time.perf_counter disable_gc=False min_rounds=5 min_time=0.000005 max_time=1.0 calibration_precision=10 warmup=False warmup_iterations=100000)
rootdir: /dls/science/users/twi18192/httomo, configfile: pyproject.toml
plugins: mpi-0.6, cov-4.1.0, typeguard-3.0.2, benchmark-4.0.0, mock-3.12.0
collected 6 items

tests/test_backends/test_httomolibgpu.py::test_recon_FBP_memoryhook[1200-3] PASSED                 [ 16%]
tests/test_backends/test_httomolibgpu.py::test_recon_FBP_memoryhook[1200-5] PASSED                 [ 33%]
tests/test_backends/test_httomolibgpu.py::test_recon_FBP_memoryhook[1200-8] PASSED                 [ 50%]
tests/test_backends/test_httomolibgpu.py::test_recon_FBP_memoryhook[2560-3] FAILED                 [ 66%]
tests/test_backends/test_httomolibgpu.py::test_recon_FBP_memoryhook[2560-5] FAILED                 [ 83%]
tests/test_backends/test_httomolibgpu.py::test_recon_FBP_memoryhook[2560-8] PASSED                 [100%]

================================================ FAILURES ================================================
___________________________________ test_recon_FBP_memoryhook[2560-3] ____________________________________
Traceback (most recent call last):
  File "/dls/science/users/twi18192/httomo/tests/test_backends/test_httomolibgpu.py", line 449, in test_recon_FBP_memoryhook
    assert estimated_memory_mb >= max_mem_mb
AssertionError: assert 444.47 >= 491.7
___________________________________ test_recon_FBP_memoryhook[2560-5] ____________________________________
Traceback (most recent call last):
  File "/dls/science/users/twi18192/httomo/tests/test_backends/test_httomolibgpu.py", line 449, in test_recon_FBP_memoryhook
    assert estimated_memory_mb >= max_mem_mb
AssertionError: assert 740.78 >= 752.81
======================================== short test summary info =========================================
FAILED tests/test_backends/test_httomolibgpu.py::test_recon_FBP_memoryhook[2560-3] - assert 444.47 >= 4...
FAILED tests/test_backends/test_httomolibgpu.py::test_recon_FBP_memoryhook[2560-5] - assert 740.78 >= 7...
====================================== 2 failed, 4 passed in 5.11s =======================================

Whereas on main, all FBP memory hook tests were passing:

(/dls/science/users/twi18192/conda-envs/httomo) [twi18192@ws448 httomo (main)]$ python -m pytest tests/test_backends/test_httomolibgpu.py::test_recon_FBP_memoryhook
========================================== test session starts ===========================================
platform linux -- Python 3.10.10, pytest-7.1.2, pluggy-1.3.0 -- /dls/science/users/twi18192/conda-envs/httomo/bin/python
cachedir: .pytest_cache
benchmark: 4.0.0 (defaults: timer=time.perf_counter disable_gc=False min_rounds=5 min_time=0.000005 max_time=1.0 calibration_precision=10 warmup=False warmup_iterations=100000)
rootdir: /dls/science/users/twi18192/httomo, configfile: pyproject.toml
plugins: mpi-0.6, cov-4.1.0, typeguard-3.0.2, benchmark-4.0.0, mock-3.12.0
collected 6 items

tests/test_backends/test_httomolibgpu.py::test_recon_FBP_memoryhook[1200-3] PASSED                 [ 16%]
tests/test_backends/test_httomolibgpu.py::test_recon_FBP_memoryhook[1200-5] PASSED                 [ 33%]
tests/test_backends/test_httomolibgpu.py::test_recon_FBP_memoryhook[1200-8] PASSED                 [ 50%]
tests/test_backends/test_httomolibgpu.py::test_recon_FBP_memoryhook[2560-3] PASSED                 [ 66%]
tests/test_backends/test_httomolibgpu.py::test_recon_FBP_memoryhook[2560-5] PASSED                 [ 83%]
tests/test_backends/test_httomolibgpu.py::test_recon_FBP_memoryhook[2560-8] PASSED                 [100%]

=========================================== 6 passed in 4.03s ============================================
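For context (an illustrative sketch, not part of the PR): the failing assertion encodes the acceptance criterion these memory-hook tests apply, visible in the test code further down. The estimate must be at least the peak memory measured by MaxMemoryHook, but must not overshoot it by more than the allowed percentage. Plugging in the numbers from the [2560-3] failure above:

# Illustration only, using the figures reported in the failing run above.
estimated_memory_mb = 444.47  # slices * per-slice estimate from _calc_memory_bytes_FBP, in MB
max_mem_mb = 491.70           # peak measured by MaxMemoryHook, minus subtract_bytes, in MB

assert estimated_memory_mb >= max_mem_mb  # fails here: the estimate undershoots the measured peak

difference_mb = abs(estimated_memory_mb - max_mem_mb)
percents_relative_maxmem = round((difference_mb / max_mem_mb) * 100)  # ~10 for these numbers
assert percents_relative_maxmem <= 20  # caps how far the estimate may overshoot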

Collaborator (Author):
Yes, as we discussed, this multiplier is speculative; I had to increase it for larger data during benchmarks. Let's handle the memory estimator for it in a separate branch.

Collaborator:
OK, I'm happy for the FBP memory estimation to be dealt with in a separate PR. In that case, shall we leave the FBP memory estimation alone in this PR and keep only the LPRec changes here?

That is, shall we drop the FBP memory estimation changes from this PR and move them into the PR for FBP memory estimation, since the FBP changes here are "incomplete" anyway?

Collaborator (Author):
Yep, sounds good. We should remove the FBP part. Sorry, I thought it would be a quick fix, so I put it here.

Collaborator:
No problem. This time I remembered to run the tests before reviewing, so it was easy enough to catch, unlike the past times when I forgot to run them... 😅



def _calc_memory_bytes_LPRec(
    non_slice_dims_shape: Tuple[int, int],
    dtype: np.dtype,
    **kwargs,
) -> Tuple[int, int]:
    angles_tot = non_slice_dims_shape[0]
    DetectorsLengthH = non_slice_dims_shape[1]
    # calculate the output shape
    output_dims = _calc_output_dim_LPRec(non_slice_dims_shape, **kwargs)

    in_slice_size = np.prod(non_slice_dims_shape) * dtype.itemsize
    out_slice_size = np.prod(DetectorsLengthH * DetectorsLengthH) * dtype.itemsize

    # interpolation kernels
    grid_size = np.prod(DetectorsLengthH * DetectorsLengthH) * np.float32().nbytes
    phi = grid_size

    eps = 1e-3  # accuracy of usfft
    mu = -np.log(eps) / (2 * DetectorsLengthH * DetectorsLengthH)
    m = int(
        np.ceil(
            2
            * DetectorsLengthH
            * 1
            / np.pi
            * np.sqrt(
                -mu * np.log(eps)
                + (mu * DetectorsLengthH) * (mu * DetectorsLengthH) / 4
            )
        )
    )
    oversampling_level = 2
    tmp_oversample_size = (
        np.prod(angles_tot * oversampling_level * DetectorsLengthH)
        * np.float32().nbytes
    )

    data_c_size = np.prod(0.5 * angles_tot * DetectorsLengthH) * np.complex64().itemsize

    fde_size = (
        (2 * m + 2 * DetectorsLengthH) * (2 * m + 2 * DetectorsLengthH)
    ) * np.complex64().itemsize

    fde2_size = (
        (2 * DetectorsLengthH) * (2 * DetectorsLengthH)
    ) * np.complex64().itemsize

    c2dfftshift_slice_size = (
        np.prod(4 * DetectorsLengthH * DetectorsLengthH) * np.int8().nbytes
    )

    filter_size = (DetectorsLengthH // 2 + 1) * np.float32().itemsize
    freq_slice = angles_tot * (DetectorsLengthH + 1) * np.complex64().itemsize
    fftplan_size = freq_slice * 2

    tot_memory_bytes = int(
        in_slice_size
        + out_slice_size
        + 2 * grid_size
        + phi
        + tmp_oversample_size
        + data_c_size
        + fde_size
        + fde2_size
        + c2dfftshift_slice_size
        + freq_slice
        + fftplan_size
    )
    return (tot_memory_bytes, filter_size)
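For a sense of scale (an editorial illustration, not part of the diff): with the geometry used in the new test below, angles_tot = 1801 and DetectorsLengthH = 2560, the usfft kernel size m and the two padded complex Fourier grids dominate the per-slice estimate:

import numpy as np

eps = 1e-3
N = 2560          # DetectorsLengthH for the test data below
angles_tot = 1801

mu = -np.log(eps) / (2 * N * N)
m = int(np.ceil(2 * N / np.pi * np.sqrt(-mu * np.log(eps) + (mu * N) ** 2 / 4)))
# m evaluates to 4 for this N

fde_size = (2 * m + 2 * N) ** 2 * np.complex64().itemsize   # ~210 MB
fde2_size = (2 * N) ** 2 * np.complex64().itemsize          # ~210 MB
in_slice_size = angles_tot * N * np.float32().itemsize      # ~18 MB
# the two fde grids alone account for over half of the roughly 0.7 GB per-slice total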

42 changes: 40 additions & 2 deletions tests/test_backends/test_httomolibgpu.py
@@ -27,7 +27,7 @@
)
from httomolibgpu.prep.stripe import remove_stripe_based_sorting, remove_stripe_ti
from httomolibgpu.misc.corr import remove_outlier
-from httomolibgpu.recon.algorithm import FBP, SIRT, CGLS
+from httomolibgpu.recon.algorithm import FBP, LPRec, SIRT, CGLS
from httomolibgpu.misc.rescale import rescale_to_int

from httomo.methods_database.packages.external.httomolibgpu.supporting_funcs.misc.morph import *
@@ -447,7 +447,45 @@ def test_recon_FBP_memoryhook(slices, recon_size_it, ensure_clean_memory):
    # the estimated_memory_mb should be LARGER or EQUAL to max_mem_mb
    # the resulting percent value should not deviate from max_mem on more than 20%
    assert estimated_memory_mb >= max_mem_mb
-   assert percents_relative_maxmem <= 35
+   assert percents_relative_maxmem <= 20


@pytest.mark.cupy
@pytest.mark.parametrize("slices", [4, 7])
def test_recon_LPRec_memoryhook(slices, ensure_clean_memory):
Collaborator:
On ws448, one of the two LPRec memory hook tests seems to fail:

(/dls/science/users/twi18192/conda-envs/httomo) [twi18192@ws448 httomo (fourier)]$ python -m pytest tests/test_backends/test_httomolibgpu.py::test_recon_LPRec_memoryhook
========================================== test session starts ===========================================
platform linux -- Python 3.10.10, pytest-7.1.2, pluggy-1.3.0 -- /dls/science/users/twi18192/conda-envs/httomo/bin/python
cachedir: .pytest_cache
benchmark: 4.0.0 (defaults: timer=time.perf_counter disable_gc=False min_rounds=5 min_time=0.000005 max_time=1.0 calibration_precision=10 warmup=False warmup_iterations=100000)
rootdir: /dls/science/users/twi18192/httomo, configfile: pyproject.toml
plugins: mpi-0.6, cov-4.1.0, typeguard-3.0.2, benchmark-4.0.0, mock-3.12.0
collected 2 items

tests/test_backends/test_httomolibgpu.py::test_recon_LPRec_memoryhook[4] FAILED                    [ 50%]
tests/test_backends/test_httomolibgpu.py::test_recon_LPRec_memoryhook[7] PASSED                    [100%]

================================================ FAILURES ================================================
_____________________________________ test_recon_LPRec_memoryhook[4] _____________________________________
Traceback (most recent call last):
  File "/dls/science/users/twi18192/httomo/tests/test_backends/test_httomolibgpu.py", line 488, in test_recon_LPRec_memoryhook
    assert percents_relative_maxmem <= 20
AssertionError: assert 23 <= 20
======================================== short test summary info =========================================
FAILED tests/test_backends/test_httomolibgpu.py::test_recon_LPRec_memoryhook[4] - assert 23 <= 20
====================================== 1 failed, 1 passed in 3.66s =======================================

Collaborator (Author):
Overall, I think the memory estimator is far from ideal, so we can delay that PR for now. I just wanted to show the potential during the benchmarks. I will come back to it again after dealing with FBP. Thanks.

    data = cp.random.random_sample((1801, slices, 2560), dtype=np.float32)
    kwargs = {}
    kwargs["angles"] = np.linspace(
        0.0 * np.pi / 180.0, 180.0 * np.pi / 180.0, data.shape[0]
    )
    kwargs["center"] = 500
    kwargs["recon_size"] = 2560
    kwargs["recon_mask_radius"] = 0.8

    hook = MaxMemoryHook()
    with hook:
        recon_data = LPRec(cp.copy(data), **kwargs)

    # make sure estimator function is within range (80% min, 100% max)
    max_mem = (
        hook.max_mem
    )  # the amount of memory in bytes needed for the method according to memoryhook

    # now we estimate how much of the total memory required for this data
    (estimated_memory_bytes, subtract_bytes) = _calc_memory_bytes_LPRec(
        (1801, 2560), dtype=np.float32(), **kwargs
    )
    estimated_memory_mb = round(slices * estimated_memory_bytes / (1024**2), 2)
    max_mem -= subtract_bytes
    max_mem_mb = round(max_mem / (1024**2), 2)

    # now we compare both memory estimations
    difference_mb = abs(estimated_memory_mb - max_mem_mb)
    percents_relative_maxmem = round((difference_mb / max_mem_mb) * 100)
    # the estimated_memory_mb should be LARGER or EQUAL to max_mem_mb
    # the resulting percent value should not deviate from max_mem on more than 20%
    assert estimated_memory_mb >= max_mem_mb
    assert percents_relative_maxmem <= 20
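As a usage note (an editorial sketch, not part of the PR): the per-slice figure returned by _calc_memory_bytes_LPRec, together with the fixed subtract_bytes term (the filter), is the kind of number that can feed a decision about how many slices fit in a given GPU memory budget. A hypothetical helper, not httomo's actual API, just to show the arithmetic:

# Hypothetical illustration only; httomo's real slab-sizing logic lives elsewhere.
def max_slices_for_budget(per_slice_bytes: int, fixed_bytes: int, gpu_budget_bytes: int) -> int:
    """Number of sinogram slices that fit when each slice costs per_slice_bytes
    and fixed_bytes (e.g. the reconstruction filter) is counted once."""
    if per_slice_bytes <= 0:
        return 0
    return max(0, (gpu_budget_bytes - fixed_bytes) // per_slice_bytes)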


@pytest.mark.cupy