# mmsegmentation/mmseg/datasets/pipelines/loading.py

# Copyright (c) OpenMMLab. All rights reserved.
import os.path as osp

import mmcv
import numpy as np

from ..builder import PIPELINES


@PIPELINES.register_module()
class LoadImageFromFile(object):
    """Load an image from file.

    The only required key is "img_info" (a dict that must contain the key
    "filename"). "img_prefix" is optional: when it is present and not None it
    is joined in front of the filename. Added or updated keys are "filename",
    "ori_filename", "img", "img_shape", "ori_shape" (same as `img_shape`),
    "pad_shape" (same as `img_shape`), "scale_factor" (1.0) and
    "img_norm_cfg" (means=0 and stds=1).

    Args:
        to_float32 (bool): Whether to convert the loaded image to a float32
            numpy array. If set to False, the loaded image is an uint8 array.
            Defaults to False.
        color_type (str): The flag argument for :func:`mmcv.imfrombytes`.
            Defaults to 'color'.
        file_client_args (dict | None): Arguments to instantiate a
            FileClient. See :class:`mmcv.fileio.FileClient` for details.
            ``None`` is treated the same as the default.
            Defaults to ``dict(backend='disk')``.
        imdecode_backend (str): Backend for :func:`mmcv.imdecode`. Default:
            'cv2'
    """

    def __init__(self,
                 to_float32=False,
                 color_type='color',
                 file_client_args=dict(backend='disk'),
                 imdecode_backend='cv2'):
        self.to_float32 = to_float32
        self.color_type = color_type
        # Accept an explicit ``None`` instead of failing on ``None.copy()``.
        if file_client_args is None:
            file_client_args = dict(backend='disk')
        # Keep a private copy so that neither the shared default dict nor the
        # caller's dict is aliased by this instance.
        self.file_client_args = file_client_args.copy()
        # The client itself is only created on the first ``__call__``.
        self.file_client = None
        self.imdecode_backend = imdecode_backend

    def __call__(self, results):
        """Call functions to load image and get image meta information.

        Args:
            results (dict): Result dict from :obj:`mmseg.CustomDataset`.

        Returns:
            dict: The dict contains loaded image and meta information.
        """

        # Create the file client lazily, on first use.
        if self.file_client is None:
            self.file_client = mmcv.FileClient(**self.file_client_args)

        # "img_prefix" is optional; without it the stored filename is used
        # as-is.
        if results.get('img_prefix') is not None:
            filename = osp.join(results['img_prefix'],
                                results['img_info']['filename'])
        else:
            filename = results['img_info']['filename']
        img_bytes = self.file_client.get(filename)
        img = mmcv.imfrombytes(
            img_bytes, flag=self.color_type, backend=self.imdecode_backend)
        if self.to_float32:
            img = img.astype(np.float32)

        # "filename" is the resolved path, "ori_filename" the un-prefixed one.
        results['filename'] = filename
        results['ori_filename'] = results['img_info']['filename']
        results['img'] = img
        results['img_shape'] = img.shape
        results['ori_shape'] = img.shape
        # Set initial values for default meta_keys
        results['pad_shape'] = img.shape
        results['scale_factor'] = 1.0
        # A 2-D array has no channel axis and is treated as single-channel.
        num_channels = 1 if len(img.shape) < 3 else img.shape[2]
        # Identity normalization config: zero mean, unit std per channel.
        results['img_norm_cfg'] = dict(
            mean=np.zeros(num_channels, dtype=np.float32),
            std=np.ones(num_channels, dtype=np.float32),
            to_rgb=False)
        return results

    def __repr__(self):
        """Return the class name followed by its main constructor options."""
        repr_str = self.__class__.__name__
        repr_str += f'(to_float32={self.to_float32},'
        repr_str += f"color_type='{self.color_type}',"
        repr_str += f"imdecode_backend='{self.imdecode_backend}')"
        return repr_str


@PIPELINES.register_module()
class LoadAnnotations(object):
    """Load annotations for semantic segmentation.

    The only required key is "ann_info" (a dict that must contain the key
    "seg_map"). Optional keys are "seg_prefix" (joined in front of the
    segmentation map filename when not None), "label_map" (a dict mapping old
    label ids to new ones) and "seg_fields" (created as an empty list when
    missing). The added key is "gt_semantic_seg", whose name is also appended
    to "seg_fields".

    Args:
        reduce_zero_label (bool): Whether reduce all label value by 1.
            Usually used for datasets where 0 is background label.
            Default: False.
        file_client_args (dict | None): Arguments to instantiate a
            FileClient. See :class:`mmcv.fileio.FileClient` for details.
            ``None`` is treated the same as the default.
            Defaults to ``dict(backend='disk')``.
        imdecode_backend (str): Backend for :func:`mmcv.imdecode`. Default:
            'pillow'
    """

    def __init__(self,
                 reduce_zero_label=False,
                 file_client_args=dict(backend='disk'),
                 imdecode_backend='pillow'):
        self.reduce_zero_label = reduce_zero_label
        # Accept an explicit ``None`` instead of failing on ``None.copy()``.
        if file_client_args is None:
            file_client_args = dict(backend='disk')
        # Keep a private copy so that neither the shared default dict nor the
        # caller's dict is aliased by this instance.
        self.file_client_args = file_client_args.copy()
        # The client itself is only created on the first ``__call__``.
        self.file_client = None
        self.imdecode_backend = imdecode_backend

    def __call__(self, results):
        """Call function to load multiple types annotations.

        Args:
            results (dict): Result dict from :obj:`mmseg.CustomDataset`.

        Returns:
            dict: The dict contains loaded semantic segmentation annotations.
        """

        # Create the file client lazily, on first use.
        if self.file_client is None:
            self.file_client = mmcv.FileClient(**self.file_client_args)

        # "seg_prefix" is optional; without it the stored path is used as-is.
        if results.get('seg_prefix', None) is not None:
            filename = osp.join(results['seg_prefix'],
                                results['ann_info']['seg_map'])
        else:
            filename = results['ann_info']['seg_map']
        img_bytes = self.file_client.get(filename)
        # Decode without colour conversion, drop size-1 axes and store the
        # labels as uint8.
        gt_semantic_seg = mmcv.imfrombytes(
            img_bytes, flag='unchanged',
            backend=self.imdecode_backend).squeeze().astype(np.uint8)
        # reduce zero_label
        if self.reduce_zero_label:
            # avoid using underflow conversion: label 0 is moved to 255
            # before the subtraction so that ``0 - 1`` never wraps around.
            gt_semantic_seg[gt_semantic_seg == 0] = 255
            gt_semantic_seg = gt_semantic_seg - 1
            # Pixels that were 0 (or already 255) are now 254; put them back
            # on 255.
            gt_semantic_seg[gt_semantic_seg == 254] = 255
        # modify if custom classes
        if results.get('label_map', None) is not None:
            # Add deep copy to solve bug of repeatedly
            # replace `gt_semantic_seg`, which is reported in
            # https://github.com/open-mmlab/mmsegmentation/pull/1445/
            # Masks are computed on the untouched copy so a pixel that has
            # just been remapped cannot be matched again by a later entry.
            gt_semantic_seg_copy = gt_semantic_seg.copy()
            for old_id, new_id in results['label_map'].items():
                gt_semantic_seg[gt_semantic_seg_copy == old_id] = new_id
        results['gt_semantic_seg'] = gt_semantic_seg
        # Tolerate result dicts that were built without a "seg_fields" list
        # instead of raising ``KeyError``.
        results.setdefault('seg_fields', []).append('gt_semantic_seg')
        return results

    def __repr__(self):
        """Return the class name followed by its main constructor options."""
        repr_str = self.__class__.__name__
        repr_str += f'(reduce_zero_label={self.reduce_zero_label},'
        repr_str += f"imdecode_backend='{self.imdecode_backend}')"
        return repr_str
[Dcos] Add header for files (#796) * Add header for files * Delete header in config files 2021-08-17 14:16:55 +08:00			`# Copyright (c) OpenMMLab. All rights reserved.`
init commit 2020-07-07 20:52:19 +08:00			`import os.path as osp`

			`import mmcv`
			`import numpy as np`

			`from ..builder import PIPELINES`


			`@PIPELINES.register_module()`
			`class LoadImageFromFile(object):`
			`"""Load an image from file.`

			`Required keys are "img_prefix" and "img_info" (a dict that must contain the`
			`key "filename"). Added or updated keys are "filename", "img", "img_shape",`
			"ori_shape" (same as `img_shape`), "pad_shape" (same as `img_shape`),
			`"scale_factor" (1.0) and "img_norm_cfg" (means=0 and stds=1).`

			`Args:`
			`to_float32 (bool): Whether to convert the loaded image to a float32`
			`numpy array. If set to False, the loaded image is an uint8 array.`
			`Defaults to False.`
			color_type (str): The flag argument for :func:`mmcv.imfrombytes`.
			`Defaults to 'color'.`
			`file_client_args (dict): Arguments to instantiate a FileClient.`
			See :class:`mmcv.fileio.FileClient` for details.
			Defaults to ``dict(backend='disk')``.
			imdecode_backend (str): Backend for :func:`mmcv.imdecode`. Default:
			`'cv2'`
			`"""`

			`def __init__(self,`
			`to_float32=False,`
			`color_type='color',`
			`file_client_args=dict(backend='disk'),`
			`imdecode_backend='cv2'):`
			`self.to_float32 = to_float32`
			`self.color_type = color_type`
			`self.file_client_args = file_client_args.copy()`
			`self.file_client = None`
			`self.imdecode_backend = imdecode_backend`

			`def __call__(self, results):`
			`"""Call functions to load image and get image meta information.`

			`Args:`
			results (dict): Result dict from :obj:`mmseg.CustomDataset`.

			`Returns:`
			`dict: The dict contains loaded image and meta information.`
			`"""`

			`if self.file_client is None:`
			`self.file_client = mmcv.FileClient(**self.file_client_args)`

			`if results.get('img_prefix') is not None:`
			`filename = osp.join(results['img_prefix'],`
			`results['img_info']['filename'])`
			`else:`
			`filename = results['img_info']['filename']`
			`img_bytes = self.file_client.get(filename)`
			`img = mmcv.imfrombytes(`
			`img_bytes, flag=self.color_type, backend=self.imdecode_backend)`
			`if self.to_float32:`
			`img = img.astype(np.float32)`

			`results['filename'] = filename`
			`results['ori_filename'] = results['img_info']['filename']`
			`results['img'] = img`
			`results['img_shape'] = img.shape`
			`results['ori_shape'] = img.shape`
			`# Set initial values for default meta_keys`
			`results['pad_shape'] = img.shape`
			`results['scale_factor'] = 1.0`
			`num_channels = 1 if len(img.shape) < 3 else img.shape[2]`
			`results['img_norm_cfg'] = dict(`
			`mean=np.zeros(num_channels, dtype=np.float32),`
			`std=np.ones(num_channels, dtype=np.float32),`
			`to_rgb=False)`
			`return results`

			`def __repr__(self):`
			`repr_str = self.__class__.__name__`
			`repr_str += f'(to_float32={self.to_float32},'`
			`repr_str += f"color_type='{self.color_type}',"`
			`repr_str += f"imdecode_backend='{self.imdecode_backend}')"`
			`return repr_str`


			`@PIPELINES.register_module()`
			`class LoadAnnotations(object):`
			`"""Load annotations for semantic segmentation.`

			`Args:`
change 'reduct' to 'reduce' (#298) 2020-12-14 02:06:01 +08:00			`reduce_zero_label (bool): Whether reduce all label value by 1.`
init commit 2020-07-07 20:52:19 +08:00			`Usually used for datasets where 0 is background label.`
			`Default: False.`
			`file_client_args (dict): Arguments to instantiate a FileClient.`
			See :class:`mmcv.fileio.FileClient` for details.
			Defaults to ``dict(backend='disk')``.
			imdecode_backend (str): Backend for :func:`mmcv.imdecode`. Default:
			`'pillow'`
			`"""`

			`def __init__(self,`
			`reduce_zero_label=False,`
			`file_client_args=dict(backend='disk'),`
			`imdecode_backend='pillow'):`
			`self.reduce_zero_label = reduce_zero_label`
			`self.file_client_args = file_client_args.copy()`
			`self.file_client = None`
			`self.imdecode_backend = imdecode_backend`

			`def __call__(self, results):`
			`"""Call function to load multiple types annotations.`

			`Args:`
			results (dict): Result dict from :obj:`mmseg.CustomDataset`.

			`Returns:`
			`dict: The dict contains loaded semantic segmentation annotations.`
			`"""`

			`if self.file_client is None:`
			`self.file_client = mmcv.FileClient(**self.file_client_args)`

			`if results.get('seg_prefix', None) is not None:`
			`filename = osp.join(results['seg_prefix'],`
			`results['ann_info']['seg_map'])`
			`else:`
			`filename = results['ann_info']['seg_map']`
			`img_bytes = self.file_client.get(filename)`
			`gt_semantic_seg = mmcv.imfrombytes(`
			`img_bytes, flag='unchanged',`
			`backend=self.imdecode_backend).squeeze().astype(np.uint8)`
[Fix] Switch order of `reduce_zero_label` and applying `label_map` (#2500) ## Motivation I want to fix a bug through this PR. The bug occurs when two options -- `reduce_zero_label=True`, and custom classes are used. `reduce_zero_label` remaps the GT seg labels by remapping the zero-class to 255 which is ignored. Conceptually, this should occur before the `label_map` is applied, which maps already reduced labels. However, currently, the `label_map` is applied before the zero label is reduced. ## Modification The modification is simple: - I've just interchanged the order of the two operations by moving 4 lines from bottom to top. - I've added a test that passes when the fix is introduced, and fails on the original `master` branch. ## BC-breaking (Optional) I do not anticipate this change braking any backward-compatibility. ## Checklist - [x] Pre-commit or other linting tools are used to fix the potential lint issues. - _I've fixed all linting/pre-commit errors._ - [x] The modification is covered by complete unit tests. If not, please add more unit test to ensure the correctness. - _I've added a unit test._ - [x] If the modification has potential influence on downstream projects, this PR should be tested with downstream projects, like MMDet or MMDet3D. - _I don't think this change affects MMDet or MMDet3D._ - [x] The documentation has been modified accordingly, like docstring or example tutorials. - _This change fixes an existing bug and doesn't require modifying any documentation/docstring._ 2023-01-19 02:01:40 -05:00			`# reduce zero_label`
			`if self.reduce_zero_label:`
			`# avoid using underflow conversion`
			`gt_semantic_seg[gt_semantic_seg == 0] = 255`
			`gt_semantic_seg = gt_semantic_seg - 1`
			`gt_semantic_seg[gt_semantic_seg == 254] = 255`
Add support for custom classes (#71) * Support for custom classes * Fix test * Fix pre-commit * Add pipeline logic for custom classes * Fix minor issues, fix test * Fix issues from PR review * Fix tests * Remove palette as str * Rename old_to_new_ids to label_map * Test for load_anns * Remove get_palette function * fixed temp * Add subset of palette, remove palette as arg * minor update Co-authored-by: Jiarui XU <xvjiarui0826@gmail.com> 2020-09-16 15:33:01 +02:00			`# modify if custom classes`
			`if results.get('label_map', None) is not None:`
fix bug about label_map (#1445) * fix bug about label_map * Update mmseg/datasets/pipelines/loading.py Co-authored-by: MengzhangLI <mcmong@pku.edu.cn> * lint Co-authored-by: MengzhangLI <mcmong@pku.edu.cn> Co-authored-by: MeowZheng <meowzheng@outlook.com> 2022-04-09 21:11:47 +08:00			`# Add deep copy to solve bug of repeatedly`
			# replace `gt_semantic_seg`, which is reported in
			`# https://github.com/open-mmlab/mmsegmentation/pull/1445/`
			`gt_semantic_seg_copy = gt_semantic_seg.copy()`
Add support for custom classes (#71) * Support for custom classes * Fix test * Fix pre-commit * Add pipeline logic for custom classes * Fix minor issues, fix test * Fix issues from PR review * Fix tests * Remove palette as str * Rename old_to_new_ids to label_map * Test for load_anns * Remove get_palette function * fixed temp * Add subset of palette, remove palette as arg * minor update Co-authored-by: Jiarui XU <xvjiarui0826@gmail.com> 2020-09-16 15:33:01 +02:00			`for old_id, new_id in results['label_map'].items():`
fix bug about label_map (#1445) * fix bug about label_map * Update mmseg/datasets/pipelines/loading.py Co-authored-by: MengzhangLI <mcmong@pku.edu.cn> * lint Co-authored-by: MengzhangLI <mcmong@pku.edu.cn> Co-authored-by: MeowZheng <meowzheng@outlook.com> 2022-04-09 21:11:47 +08:00			`gt_semantic_seg[gt_semantic_seg_copy == old_id] = new_id`
init commit 2020-07-07 20:52:19 +08:00			`results['gt_semantic_seg'] = gt_semantic_seg`
			`results['seg_fields'].append('gt_semantic_seg')`
			`return results`

			`def __repr__(self):`
			`repr_str = self.__class__.__name__`
			`repr_str += f'(reduce_zero_label={self.reduce_zero_label},'`
			`repr_str += f"imdecode_backend='{self.imdecode_backend}')"`
			`return repr_str`