pad_images must be in terratorch/models/utils.py (moved out of terratorch/models/backbones/prithvi_vit.py)

Signed-off-by: João Lucas de Sousa Almeida <[email protected]>
IBM · romeokienzler · Jan 29, 2025 · Dec 23, 2024 · Jan 2, 2025 · Jan 2, 2025
commit 9c26eab4ea979c40f4bcf9b7da831d3e2f7efc8d
diff --git a/terratorch/models/backbones/prithvi_vit.py b/terratorch/models/backbones/prithvi_vit.py
@@ -10,6 +10,7 @@
 from terratorch.models.backbones.select_patch_embed_weights import select_patch_embed_weights
 from terratorch.datasets.utils import generate_bands_intervals
 from terratorch.models.backbones.prithvi_mae import PrithviViT, PrithviMAE
+from terratorch.models.utils import pad_images
 
 logger = logging.getLogger(__name__)
 
@@ -153,20 +154,6 @@ def checkpoint_filter_fn_mae(
 
     return state_dict
 
-
-def pad_images(imgs: Tensor,patch_size: int, padding:str) -> Tensor:
-    p = patch_size
-    # h, w = imgs.shape[3], imgs.shape[4]
-    t, h, w = imgs.shape[-3:]
-    h_pad, w_pad = (p - h % p) % p, (p - w % p) % p  # Ensure padding is within bounds
-    if h_pad > 0 or w_pad > 0:
-        imgs = torch.stack([
-            nn.functional.pad(img, (0, w_pad, 0, h_pad), mode=padding)
-            for img in imgs  # Apply per image to avoid NotImplementedError from torch.nn.functional.pad
-        ])
-    return imgs
-
-
 def _create_prithvi(
     variant: str,
     pretrained: bool = False,  # noqa: FBT001, FBT002

diff --git a/terratorch/models/pixel_wise_model.py b/terratorch/models/pixel_wise_model.py
@@ -8,7 +8,7 @@
 
 from terratorch.models.heads import RegressionHead, SegmentationHead
 from terratorch.models.model import AuxiliaryHeadWithDecoderWithoutInstantiatedHead, Model, ModelOutput
-from terratorch.models.backbones.prithvi_vit import pad_images
+from terratorch.models.utils import pad_images
 
 def freeze_module(module: nn.Module):
     for param in module.parameters():

diff --git a/terratorch/models/scalar_output_model.py b/terratorch/models/scalar_output_model.py
@@ -6,7 +6,7 @@
 
 from terratorch.models.heads import ClassificationHead
 from terratorch.models.model import AuxiliaryHeadWithDecoderWithoutInstantiatedHead, Model, ModelOutput
-
+from terratorch.models.utils import pad_images
 
 def freeze_module(module: nn.Module):
     for param in module.parameters():

diff --git a/terratorch/models/utils.py b/terratorch/models/utils.py
@@ -1,3 +1,6 @@
+import torch
+from torch import nn, Tensor
+
 class DecoderNotFoundError(Exception):
     pass
 
@@ -11,3 +14,16 @@ def extract_prefix_keys(d: dict, prefix: str) -> dict:
             remaining_dict[k] = v
 
     return extracted_dict, remaining_dict
+
+def pad_images(imgs: Tensor,patch_size: int, padding:str) -> Tensor:
+    p = patch_size
+    # Pad the last two dims (h, w) so each becomes a multiple of p; t is unpacked but not used below.
+    t, h, w = imgs.shape[-3:]
+    h_pad, w_pad = (p - h % p) % p, (p - w % p) % p  # Extra size needed along h and w; 0 when already a multiple of p
+    if h_pad > 0 or w_pad > 0:
+        imgs = torch.stack([
+            nn.functional.pad(img, (0, w_pad, 0, h_pad), mode=padding)  # Pads only the trailing side of w and h
+            for img in imgs  # Apply per image to avoid NotImplementedError from torch.nn.functional.pad
+        ])
+    return imgs
+