@@ -113,8 +113,8 @@ def __init__(
         )

     def forward(self, *features):
-        # Resize all FPN features to the size of the largest feature
-        target_size = features[0].shape[2:]
+        output_size = features[0].shape[2:]
+        target_size = [size // 4 for size in output_size]

         features = features[1:]  # remove first skip with same spatial resolution
         features = features[::-1]  # reverse channels to start from head of encoder
@@ -126,6 +126,7 @@ def forward(self, *features):
             fpn_feature = stage(fpn_features[-1], feature)
             fpn_features.append(fpn_feature)

+        # Resize all FPN features to 1/4 of the original resolution.
         resized_fpn_features = []
         for feature in fpn_features:
             resized_feature = F.interpolate(
@@ -134,5 +135,8 @@ def forward(self, *features):
             resized_fpn_features.append(resized_feature)

         output = self.fpn_bottleneck(torch.cat(resized_fpn_features, dim=1))
+        output = F.interpolate(
+            output, size=output_size, mode="bilinear", align_corners=False
+        )

         return output
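
For reference, a minimal standalone sketch of what this change does: the FPN levels are first resized to 1/4 of the input resolution before fusion, and the fused output is then upsampled back to the full input size. The tensor shapes, channel counts, and the 1x1 convolution standing in for `fpn_bottleneck` are illustrative assumptions, not the decoder's actual configuration.

```python
import torch
import torch.nn.functional as F

# Hypothetical input: the highest-resolution skip is 64x64 (the input size),
# deeper FPN levels sit at strides 4 to 32.
output_size = (64, 64)                       # features[0].shape[2:]
target_size = [s // 4 for s in output_size]  # 1/4 resolution: [16, 16]

fpn_features = [
    torch.randn(1, 256, 16, 16),  # stride 4
    torch.randn(1, 256, 8, 8),    # stride 8
    torch.randn(1, 256, 4, 4),    # stride 16
    torch.randn(1, 256, 2, 2),    # stride 32
]

# Bring every FPN level to 1/4 of the input resolution before fusion.
resized = [
    F.interpolate(f, size=target_size, mode="bilinear", align_corners=False)
    for f in fpn_features
]
fused = torch.cat(resized, dim=1)  # (1, 1024, 16, 16)

# A 1x1 conv stands in for the decoder's fpn_bottleneck in this sketch.
bottleneck = torch.nn.Conv2d(fused.shape[1], 256, kernel_size=1)
output = bottleneck(fused)         # (1, 256, 16, 16)

# The newly added final interpolate restores the full input resolution.
output = F.interpolate(output, size=output_size, mode="bilinear", align_corners=False)
print(output.shape)  # torch.Size([1, 256, 64, 64])
```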