Skip to content

Commit 7593660

Browse files
committed
more tests
Signed-off-by: Wenqi Li <wenqil@nvidia.com>
1 parent 011854f commit 7593660

File tree

3 files changed

+47
-33
lines changed

3 files changed

+47
-33
lines changed

monai/inferers/inferer.py

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -366,6 +366,9 @@ class SlidingWindowInferer(Inferer):
366366
cpu_thresh: when provided, dynamically switch to stitching on cpu (to save gpu memory)
367367
when input image volume is larger than this threshold (in pixels/voxels).
368368
Otherwise use ``"device"``. Thus, the output may end-up on either cpu or gpu.
369+
buffer_steps: the number of sliding window iterations before writing the outputs to ``device``.
370+
default is None, no buffer.
371+
buffer_dim: the dimension along which the buffers are created, default is 0.
369372
370373
Note:
371374
``sw_batch_size`` denotes the max number of windows per network inference iteration,
@@ -387,6 +390,8 @@ def __init__(
387390
progress: bool = False,
388391
cache_roi_weight_map: bool = False,
389392
cpu_thresh: int | None = None,
393+
buffer_steps: int | None = None,
394+
buffer_dim: int = 0,
390395
) -> None:
391396
super().__init__()
392397
self.roi_size = roi_size
@@ -400,6 +405,8 @@ def __init__(
400405
self.device = device
401406
self.progress = progress
402407
self.cpu_thresh = cpu_thresh
408+
self.buffer_steps = buffer_steps
409+
self.buffer_dim = buffer_dim
403410

404411
# compute_importance_map takes long time when computing on cpu. We thus
405412
# compute it once if it's static and then save it for future usage
@@ -456,6 +463,8 @@ def __call__(
456463
self.progress,
457464
self.roi_weight_map,
458465
None,
466+
self.buffer_steps,
467+
self.buffer_dim,
459468
*args,
460469
**kwargs,
461470
)

monai/inferers/utils.py

Lines changed: 36 additions & 33 deletions
Original file line numberDiff line numberDiff line change
@@ -53,6 +53,8 @@ def sliding_window_inference(
5353
progress: bool = False,
5454
roi_weight_map: torch.Tensor | None = None,
5555
process_fn: Callable | None = None,
56+
buffer_steps: int | None = None,
57+
buffer_dim: int = 0,
5658
*args: Any,
5759
**kwargs: Any,
5860
) -> torch.Tensor | tuple[torch.Tensor, ...] | dict[Any, torch.Tensor]:
@@ -114,26 +116,23 @@ def sliding_window_inference(
114116
roi_weight_map: pre-computed (non-negative) weight map for each ROI.
115117
If not given, and ``mode`` is not `constant`, this map will be computed on the fly.
116118
process_fn: process inference output and adjust the importance map per window
119+
buffer_steps: the number of sliding window iterations before writing the outputs to ``device``.
120+
default is None, no buffer.
121+
buffer_dim: the dimension along which the buffers are created, default is 0.
117122
args: optional args to be passed to ``predictor``.
118123
kwargs: optional keyword args to be passed to ``predictor``.
119124
120-
- buffer_steps: the number of sliding window iterations before writing the outputs to ``device``.
121-
default is None, no buffer.
122-
- buffer_dim: the dimension along which the buffer are created, default is 0.
123-
124125
Note:
125126
- input must be channel-first and have a batch dim, supports N-D sliding window.
126127
127128
"""
128-
b_steps = kwargs.pop("buffer_steps", None)
129-
b_plane = kwargs.pop("buffer_dim", 0)
130-
buffered = b_steps is not None and b_steps > 0
129+
buffered = buffer_steps is not None and buffer_steps > 0
131130
num_spatial_dims = len(inputs.shape) - 2
132131
if buffered:
133-
if b_plane < -num_spatial_dims + 1 or b_plane > num_spatial_dims:
134-
raise ValueError(f"buffer_dim must be in [{-num_spatial_dims + 1}, {num_spatial_dims}], got {b_plane}.")
135-
if b_steps <= 0:
136-
raise ValueError(f"buffer_steps must be >= 0, got {b_steps}.")
132+
if buffer_dim < -num_spatial_dims + 1 or buffer_dim > num_spatial_dims:
133+
raise ValueError(f"buffer_dim must be in [{-num_spatial_dims + 1}, {num_spatial_dims}], got {buffer_dim}.")
134+
if buffer_steps <= 0: # type: ignore
135+
raise ValueError(f"buffer_steps must be > 0, got {buffer_steps}.")
137136
if overlap < 0 or overlap >= 1:
138137
raise ValueError(f"overlap must be >= 0 and < 1, got {overlap}.")
139138
compute_dtype = inputs.dtype
@@ -165,25 +164,31 @@ def sliding_window_inference(
165164
slices = dense_patch_slices(image_size, roi_size, scan_interval, return_slice=False)
166165

167166
slices_np = np.asarray(slices)
168-
if b_plane < 0:
169-
b_plane += num_spatial_dims
170-
slices_np = slices_np[np.argsort(slices_np[:, b_plane, 0], kind="mergesort")]
167+
if buffer_dim < 0:
168+
buffer_dim += num_spatial_dims
169+
slices_np = slices_np[np.argsort(slices_np[:, buffer_dim, 0], kind="mergesort")]
171170
slices = [tuple(slice(c[0], c[1]) for c in i) for i in slices_np]
172-
_, _p_id, _b_lens = np.unique(slices_np[:, b_plane, 0], return_counts=True, return_index=True)
173-
b_se = [tuple(slices_np[i][b_plane]) for i in _p_id] # buffer start & end along the b_plane
174-
b_ends = np.cumsum(np.repeat(_b_lens, batch_size)) # buffer flush boundaries
171+
_, _p_id, _b_lens = np.unique(slices_np[:, buffer_dim, 0], return_counts=True, return_index=True)
172+
_b_se = [tuple(slices_np[i][buffer_dim]) for i in _p_id] # buffer start & end along the buffer_dim
173+
b_ends = np.cumsum(_b_lens).tolist() # possible buffer flush boundaries
175174

176175
num_win = len(slices) # number of windows per image
177176
total_slices = num_win * batch_size # total number of windows
178177
windows_range: Iterable
179178
if not buffered:
180179
windows_range = range(0, total_slices, sw_batch_size)
181180
else:
182-
b_steps = min(len(b_se), b_steps)
183-
x = [0, *b_ends][::b_steps]
181+
buffer_steps = min(len(_b_se), int(buffer_steps)) # type: ignore
182+
x = [0, *b_ends][::buffer_steps]
184183
if x[-1] < b_ends[-1]:
185184
x.append(b_ends[-1])
186-
windows_range = itertools.chain(*[range(x[i], x[i + 1], sw_batch_size) for i in range(len(x) - 1)])
185+
windows_range, n_per_batch, b_ends = [], len(x) - 1, [0]
186+
for b in range(batch_size):
187+
offset = b * x[-1]
188+
for i in range(n_per_batch):
189+
windows_range.append(range(offset + x[i], offset + x[i + 1], sw_batch_size))
190+
b_ends.append(offset + x[i + 1])
191+
windows_range = itertools.chain(*windows_range)
187192

188193
# Create window-level importance map
189194
valid_patch_size = get_valid_patch_size(image_size, roi_size)
@@ -206,8 +211,7 @@ def sliding_window_inference(
206211
output_image_list, count_map_list, sw_device_buffer, b_s, b_i = [], [], [], 0, 0 # type: ignore
207212
# for each patch
208213
for slice_g in tqdm(windows_range) if progress else windows_range:
209-
_cur_max = b_ends[b_s + b_steps - 1] if buffered else total_slices
210-
slice_range = range(slice_g, min(slice_g + sw_batch_size, _cur_max))
214+
slice_range = range(slice_g, min(slice_g + sw_batch_size, b_ends[b_s + 1] if buffered else total_slices))
211215
unravel_slice = [
212216
[slice(idx // num_win, idx // num_win + 1), slice(None)] + list(slices[idx % num_win])
213217
for idx in slice_range
@@ -223,22 +227,21 @@ def sliding_window_inference(
223227
importance_map = importance_map_
224228

225229
if buffered:
226-
# if len(seg_tuple) > 1:
227-
# warnings.warn("Multiple outputs are not supported with buffer_steps")
228-
c_start, c_end = b_se[b_s % len(b_se)], b_se[(b_s + b_steps - 1) % len(b_se)]
230+
c_start = slices_np[b_ends[b_s] % num_win, buffer_dim, 0]
231+
c_end = slices_np[(b_ends[b_s + 1] - 1) % num_win, buffer_dim, 1]
229232
if not sw_device_buffer:
230-
k = seg_tuple[0].shape[1]
233+
k = seg_tuple[0].shape[1] # len(seg_tuple) > 1 is currently ignored
231234
sp_size = list(image_size)
232-
sp_size[b_plane] = max(c_end[1] - c_start[0], roi_size[b_plane])
235+
sp_size[buffer_dim] = c_end - c_start
233236
sw_device_buffer = [torch.zeros(size=[1, k, *sp_size], dtype=compute_dtype, device=sw_device)]
234237
importance_map = importance_map.to(dtype=compute_dtype, device=sw_device)
235238
for p, s in zip(seg_tuple[0], unravel_slice):
236-
offset = s[b_plane + 2].start - c_start[0]
237-
s[b_plane + 2] = slice(offset, offset + roi_size[b_plane])
239+
offset = s[buffer_dim + 2].start - c_start
240+
s[buffer_dim + 2] = slice(offset, offset + roi_size[buffer_dim])
238241
s[0] = slice(0, 1)
239242
sw_device_buffer[0][s] += p * importance_map
240243
b_i += len(unravel_slice)
241-
if b_i < b_ends[b_s + b_steps - 1]:
244+
if b_i < b_ends[b_s + 1]:
242245
continue
243246
else:
244247
sw_device_buffer = seg_tuple
@@ -269,8 +272,8 @@ def sliding_window_inference(
269272
w_t = w_t.to(sw_device)
270273
if buffered:
271274
o_slice = [slice(None)] * len(inputs.shape)
272-
o_slice[b_plane + 2] = slice(c_start[0], c_end[1])
273-
img_b = b_s // len(b_se) # image batch index
275+
o_slice[buffer_dim + 2] = slice(c_start, c_end)
276+
img_b = b_s // n_per_batch # image batch index
274277
o_slice[0] = slice(img_b, img_b + 1)
275278
output_image_list[0][o_slice] += sw_device_buffer[0].to(device=device)
276279
else:
@@ -280,7 +283,7 @@ def sliding_window_inference(
280283
_compute_coords(sw_batch_size, unravel_slice, z_scale, output_image_list[ss], sw_t)
281284
sw_device_buffer = []
282285
if buffered:
283-
b_s += b_steps
286+
b_s += 1
284287

285288
# account for any overlapping sections
286289
for ss in range(len(output_image_list)):

tests/test_sliding_window_inference.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -244,6 +244,8 @@ def compute(data, test1, test2):
244244
has_tqdm,
245245
None,
246246
None,
247+
None,
248+
0,
247249
t1,
248250
test2=t2,
249251
)

0 commit comments

Comments
 (0)