Skip to content
82 changes: 42 additions & 40 deletions httomo/runner/dataset_store_backing.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,18 +5,19 @@
from numpy.typing import DTypeLike
from mpi4py import MPI

from httomo.data.hdf._utils.reslice import reslice_memory_estimator
from httomo.runner.section import Section, determine_section_padding
from httomo.utils import _get_slicing_dim, make_3d_shape_from_shape


def calculate_section_chunk_shape(
def calculate_section_input_chunk_shape(
comm: MPI.Comm,
global_shape: Tuple[int, int, int],
slicing_dim: int,
padding: Tuple[int, int],
) -> Tuple[int, int, int]:
"""
Calculate chunk shape (w/ or w/o padding) for a section.
Calculate the shape of the section input chunk w/ or w/o padding.
"""
start = round((global_shape[slicing_dim] / comm.size) * comm.rank)
stop = round((global_shape[slicing_dim] / comm.size) * (comm.rank + 1))
Expand All @@ -26,53 +27,37 @@ def calculate_section_chunk_shape(
return make_3d_shape_from_shape(shape)


def calculate_section_chunk_bytes(
def calculate_section_output_chunk_shape(
chunk_shape: Tuple[int, int, int],
dtype: DTypeLike,
section: Section,
) -> int:
) -> Tuple[int, int, int]:
"""
Calculate the number of bytes in the section output chunk that is written to the store. This
accounts for data's non-slicing dims changing during processing, which changes the chunk
shape for the section and thus affects the number of bytes in the chunk.
Calculate the shape of the section output chunk that is written to the store. This
accounts for the data's non-slicing dims changing during processing, which changes the
chunk shape for the section.
"""
slicing_dim = _get_slicing_dim(section.pattern) - 1
non_slice_dims_list = list(chunk_shape)
non_slice_dims_list.pop(slicing_dim)
non_slice_dims = (non_slice_dims_list[0], non_slice_dims_list[1])
input_non_slice_dims = (non_slice_dims_list[0], non_slice_dims_list[1])
output_non_slice_dims = input_non_slice_dims

for method in section.methods:
if method.memory_gpu is None:
continue
non_slice_dims = method.calculate_output_dims(non_slice_dims)
output_non_slice_dims = method.calculate_output_dims(input_non_slice_dims)

return int(
np.prod(non_slice_dims) * chunk_shape[slicing_dim] * np.dtype(dtype).itemsize
)
output_chunk_shape = list(output_non_slice_dims)
output_chunk_shape.insert(slicing_dim, chunk_shape[slicing_dim])

return make_3d_shape_from_shape(output_chunk_shape)


class DataSetStoreBacking(Enum):
    """Backing medium for a dataset store."""

    # Chunks are held in main memory.
    RAM = 1
    # Chunks are written out to a file-backed store.
    File = 2


def _non_last_section_in_pipeline(
    memory_limit_bytes: int,
    write_chunk_bytes: int,
    read_chunk_bytes: int,
) -> DataSetStoreBacking:
    """
    Calculate backing of dataset store for non-last sections in pipeline.

    Returns ``DataSetStoreBacking.File`` when a positive memory limit is set
    and the combined read + write chunk sizes reach that limit; otherwise
    returns ``DataSetStoreBacking.RAM``.
    """
    # A non-positive limit disables the file-backing check entirely.
    if memory_limit_bytes <= 0:
        return DataSetStoreBacking.RAM

    total_chunk_bytes = write_chunk_bytes + read_chunk_bytes
    if total_chunk_bytes >= memory_limit_bytes:
        return DataSetStoreBacking.File

    return DataSetStoreBacking.RAM


def determine_store_backing(
comm: MPI.Comm,
sections: List[Section],
Expand All @@ -84,7 +69,7 @@ def determine_store_backing(
# Get chunk shape created by reader of section `n` (the current section) that will account
# for padding. This chunk shape is based on the chunk shape written by the writer of
# section `n - 1` (the previous section)
padded_input_chunk_shape = calculate_section_chunk_shape(
padded_input_chunk_shape = calculate_section_input_chunk_shape(
comm=comm,
global_shape=global_shape,
slicing_dim=_get_slicing_dim(sections[section_idx].pattern) - 1,
Expand All @@ -96,7 +81,7 @@ def determine_store_backing(

# Get unpadded chunk shape input to current section (for calculation of bytes in output
# chunk for the current section)
input_chunk_shape = calculate_section_chunk_shape(
input_chunk_shape = calculate_section_input_chunk_shape(
comm=comm,
global_shape=global_shape,
slicing_dim=_get_slicing_dim(sections[section_idx].pattern) - 1,
Expand All @@ -106,21 +91,38 @@ def determine_store_backing(
# Get the number of bytes in the input chunk to the section w/ potential modifications to
# the non-slicing dims, to then determine the number of bytes in the output chunk written
# by the current section
output_chunk_bytes = calculate_section_chunk_bytes(
output_chunk_shape = calculate_section_output_chunk_shape(
chunk_shape=input_chunk_shape,
dtype=dtype,
section=sections[section_idx],
)
output_chunk_bytes = int(np.prod(output_chunk_shape) * np.dtype(dtype).itemsize)

# If a reslice operation would occur in moving from the current section to the next
# section, then calculate the number of bytes the reslice operation would take, given the
# input to it (which would be the output chunk of the current section)
reslice_bytes = 0
if (
comm.size > 1
and section_idx < len(sections) - 1
and sections[section_idx].pattern != sections[section_idx + 1].pattern
):
ring_algorithm_bytes, reslice_output_bytes = reslice_memory_estimator(
output_chunk_shape,
dtype,
_get_slicing_dim(sections[section_idx].pattern),
_get_slicing_dim(sections[section_idx + 1].pattern),
comm,
)
reslice_bytes += ring_algorithm_bytes + reslice_output_bytes

send_buffer = np.zeros(1, dtype=bool)
recv_buffer = np.zeros(1, dtype=bool)
store_backing = _non_last_section_in_pipeline(
memory_limit_bytes=memory_limit_bytes,
read_chunk_bytes=padded_input_chunk_bytes,
write_chunk_bytes=output_chunk_bytes,
)

if store_backing is DataSetStoreBacking.File:
if (
memory_limit_bytes > 0
and padded_input_chunk_bytes + output_chunk_bytes + reslice_bytes
>= memory_limit_bytes
):
send_buffer[0] = True

# do a logical OR of all the enum variants across the processes
Expand Down
Loading
Loading