Hi @andife, thanks for the question! Here's an example showing how you can use custom transforms from albumentations with the semantic segmentation task. The key is that `train_per_sample_transform` is used only during training, while the unprefixed `per_sample_transform` is the default for the other stages, so the random augmentations are not applied during validation or prediction:

```python
from dataclasses import dataclass
from functools import partial
from typing import Tuple

import albumentations as A
import torch

import flash
from flash import InputTransform
from flash.core.data.utils import download_data
from flash.image import SemanticSegmentation, SemanticSegmentationData

# 1. Create the DataModule
# The data was generated with the CARLA self-driving simulator as part of the Kaggle Lyft Udacity Challenge.
# More info here: https://www.kaggle.com/kumaresanmanickavelu/lyft-udacity-challenge
download_data(
    "https://github.com/ongchinkiat/LyftPerceptionChallenge/releases/download/v0.1/carla-capture-20180513A.zip",
    "./data",
)


@dataclass
class CustomTransform(InputTransform):
    image_size: Tuple[int, int] = (300, 300)
    crop_size: Tuple[int, int] = (256, 256)

    def __post_init__(self):
        # Training pipeline: resize, random crop, and random augmentations.
        self.train_transform = A.Compose([
            A.Resize(width=self.image_size[0], height=self.image_size[1]),
            A.RandomCrop(width=self.crop_size[0], height=self.crop_size[1]),
            A.HorizontalFlip(p=0.5),
            A.RandomBrightnessContrast(p=0.2),
        ])
        # Validation / prediction pipeline: deterministic resize and center crop.
        self.transform = A.Compose([
            A.Resize(width=self.image_size[0], height=self.image_size[1]),
            A.CenterCrop(width=self.crop_size[0], height=self.crop_size[1]),
        ])
        super().__post_init__()

    @staticmethod
    def _apply_transform(transform, sample):
        # Albumentations expects channels-last numpy arrays, so convert from the
        # (C, H, W) tensors Flash provides and convert back again afterwards.
        if "target" in sample:
            kwargs = {"mask": sample["target"].numpy()}
        else:
            kwargs = {}
        transformed = transform(image=sample["input"].permute(1, 2, 0).numpy(), **kwargs)
        sample["input"] = torch.from_numpy(transformed["image"]).permute(2, 0, 1)
        if "mask" in transformed:
            sample["target"] = torch.from_numpy(transformed["mask"])
        return sample

    def per_sample_transform(self):
        return partial(self._apply_transform, self.transform)

    def train_per_sample_transform(self):
        return partial(self._apply_transform, self.train_transform)

    @staticmethod
    def _prepare_target(target) -> torch.Tensor:
        """Convert the target mask to long and remove the channel dimension."""
        return target.long().squeeze(1)

    def target_per_batch_transform(self):
        return self._prepare_target


datamodule = SemanticSegmentationData.from_folders(
    train_folder="data/CameraRGB",
    train_target_folder="data/CameraSeg",
    val_split=0.1,
    train_transform=CustomTransform,
    val_transform=CustomTransform,
    transform_kwargs=dict(image_size=(300, 300)),
    num_classes=21,
    batch_size=4,
)

# 2. Build the task
model = SemanticSegmentation(
    backbone="mobilenetv3_large_100",
    head="fpn",
    num_classes=datamodule.num_classes,
)

# 3. Create the trainer and finetune the model
trainer = flash.Trainer(max_epochs=3, gpus=torch.cuda.device_count(), fast_dev_run=True)
trainer.finetune(model, datamodule=datamodule, strategy="freeze")

# 4. Segment a few images!
datamodule = SemanticSegmentationData.from_files(
    predict_transform=CustomTransform,
    predict_files=[
        "data/CameraRGB/F61-1.png",
        "data/CameraRGB/F62-1.png",
        "data/CameraRGB/F63-1.png",
    ],
    batch_size=3,
)
predictions = trainer.predict(model, datamodule=datamodule)
print(predictions)

# 5. Save the model!
trainer.save_checkpoint("semantic_segmentation_model.pt")
```

Hope that helps 😃
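If you later want to run prediction from the saved checkpoint (for example in a separate script), something along these lines should work. This is just a sketch: `load_from_checkpoint` is the standard Lightning classmethod inherited by Flash tasks, and it assumes the `CustomTransform` class above is in scope (e.g. imported from your own module):

```python
import flash
from flash.image import SemanticSegmentation, SemanticSegmentationData

# Restore the finetuned task from the checkpoint saved above.
model = SemanticSegmentation.load_from_checkpoint("semantic_segmentation_model.pt")

# Reuse the same custom transform for prediction-time preprocessing.
# NOTE: assumes CustomTransform (defined above) is importable here.
datamodule = SemanticSegmentationData.from_files(
    predict_transform=CustomTransform,
    predict_files=["data/CameraRGB/F61-1.png"],
    batch_size=1,
)

trainer = flash.Trainer()
predictions = trainer.predict(model, datamodule=datamodule)
```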
Hello,
I'm trying to use a more advanced/specific image augmentation setup for a pytorch-flash task.
As a starting point, I looked at the following examples and combined them:
#1107
https://lightning-flash.readthedocs.io/en/stable/reference/semantic_segmentation.html
The error I get is, as I understand it, because icevision is not implemented for the semantic segmentation task. Since it seems to be implemented for instance_segmentation, shouldn't the code be transferable to the semantic segmentation functionality?
Another option I tried was https://github.com/PyTorchLightning/lightning-flash#flash-transforms, but I realized that segmentation/input_transform.py does not yet have the same functionality as flash.image.classification.input_transform.
What would be the next recommended steps?