Make it 2D/3D compatible; remove an outdated comment

Can-Zhao · Can-Zhao · commit 8555b674a4e0 · 2025-03-10T14:56:52.000Z
Signed-off-by: Can-Zhao <volcanofly@gmail.com>
diff --git a/monai/networks/schedulers/rectified_flow.py b/monai/networks/schedulers/rectified_flow.py
@@ -174,10 +174,15 @@ def add_noise(self, original_samples: torch.Tensor, noise: torch.Tensor, timeste
         timepoints: torch.Tensor = timesteps.float() / self.num_train_timesteps
         timepoints = 1 - timepoints  # [1,1/1000]
 
-        # timepoint  (bsz) noise: (bsz, 4, frame, w ,h)
         # expand timepoint to noise shape
-        timepoints = timepoints.unsqueeze(1).unsqueeze(1).unsqueeze(1).unsqueeze(1)
-        timepoints = timepoints.repeat(1, noise.shape[1], noise.shape[2], noise.shape[3], noise.shape[4])
+        if len(noise.shape) == 5:
+            timepoints = timepoints.unsqueeze(1).unsqueeze(1).unsqueeze(1).unsqueeze(1)
+            timepoints = timepoints.repeat(1, noise.shape[1], noise.shape[2], noise.shape[3], noise.shape[4])
+        elif len(noise.shape) == 4:
+            timepoints = timepoints.unsqueeze(1).unsqueeze(1).unsqueeze(1)
+            timepoints = timepoints.repeat(1, noise.shape[1], noise.shape[2], noise.shape[3])
+        else:
+            raise ValueError(f"noise has to be 4D or 5D tensor. yet got shape of {noise.shape}.")
         noisy_samples: torch.Tensor = timepoints * original_samples + (1 - timepoints) * noise
 
         return noisy_samples
@@ -246,7 +251,7 @@ def sample_timesteps(self, x_start):
             t = t.long()
 
         if self.use_timestep_transform:
-            input_img_size_numel = torch.prod(torch.tensor(x_start.shape[-3:]))
+            input_img_size_numel = torch.prod(torch.tensor(x_start.shape[2:]))
             t = timestep_transform(
                 t,
                 input_img_size_numel=input_img_size_numel,