# Copyright (c) OpenMMLab. All rights reserved.
import os
from multiprocessing import cpu_count
import numpy as np
from easycv.datasets.registry import DATASOURCES
from easycv.file import io
from .base import DetSourceBase
def parse_txt(source_item, classes):
    """Parse one WiderPerson annotation txt file into a detection sample.

    Annotation file layout: the first line is the number of boxes, then one
    line per box: ``<cls_id> <x1> <y1> <x2> <y2>``. Class ids in the file
    are 1-based and are shifted to 0-based here.

    Args:
        source_item: tuple of ``(img_path, txt_path)``.
        classes: class name list (unused here; kept for the shared
            ``parse_fn`` interface of detection data sources).

    Returns:
        dict with keys:
            'gt_bboxes' (np.ndarray, float32, shape (N, 4)): boxes in
                (x1, y1, x2, y2) order as stored in the file.
            'gt_labels' (np.ndarray, int64, shape (N,)): 0-based class ids.
            'filename' (str): path of the image.

    Raises:
        ValueError: if the declared box count does not match the number of
            annotation lines.
    """
    img_path, txt_path = source_item
    with io.open(txt_path, 'r') as t:
        label_lines = t.read().splitlines()

    num = int(label_lines[0])
    label_lines = label_lines[1:]
    # Explicit raise instead of `assert`: asserts are stripped under `-O`
    # and the original message carried no context for debugging.
    if len(label_lines) != num:
        raise ValueError(
            'number of boxes (%d) does not match the declared count (%d) in %s'
            % (len(label_lines), num, txt_path))

    gt_bboxes = []
    gt_labels = []
    for obj in label_lines:
        line = obj.split()
        # WiderPerson class ids are 1-based in the annotation files.
        cls_id = int(line[0]) - 1
        box = (float(line[1]), float(line[2]), float(line[3]),
               float(line[4]))
        gt_bboxes.append(box)
        gt_labels.append(cls_id)

    # Keep a well-formed (0, 4) array for images without annotations so
    # downstream concatenation/stacking does not break on shape (0,).
    if len(gt_bboxes) == 0:
        gt_bboxes = np.zeros((0, 4), dtype=np.float32)

    img_info = {
        'gt_bboxes': np.array(gt_bboxes, dtype=np.float32),
        'gt_labels': np.array(gt_labels, dtype=np.int64),
        'filename': img_path,
    }
    return img_info
@DATASOURCES.register_module
class DetSourceWiderPerson(DetSourceBase):
    """Data source for the WiderPerson dense pedestrian detection dataset.

    dataset_name='Wider Person',
    paper_info=@article{zhang2019widerperson,
        Author = {Zhang, Shifeng and Xie, Yiliang and Wan, Jun and Xia, Hansheng and Li, Stan Z. and Guo, Guodong},
        journal = {IEEE Transactions on Multimedia (TMM)},
        Title = {WiderPerson: A Diverse Dataset for Dense Pedestrian Detection in the Wild},
        Year = {2019}}

    data dir is as follows:
    ```
    |- data
        |-Images
            |-000040.jpg
            |-...
        |-Annotations
            |-000040.jpg.txt
            |-...
        |-train.txt
        |-val.txt
        |-...
    ```
    Example1:
        data_source = DetSourceWiderPerson(
            path='/your/data/train.txt',
            classes=${CLASSES},
        )
    Example2:
        data_source = DetSourceWiderPerson(
            path='/your/data/train.txt',
            classes=${CLASSES},
            img_root_path='/your/data/Images',
            label_root_path='/your/data/Annotations'
        )
    """
    CLASSES = [
        'pedestrians', 'riders', 'partially-visible persons', 'ignore regions',
        'crowd'
    ]

    def __init__(self,
                 path,
                 classes=CLASSES,
                 img_root_path=None,
                 label_root_path=None,
                 cache_at_init=False,
                 cache_on_the_fly=False,
                 img_suffix='.jpg',
                 label_suffix='.txt',
                 parse_fn=parse_txt,
                 num_processes=int(cpu_count() / 2),
                 **kwargs) -> None:
        """
        Args:
            path: path of img id list file in root
            classes: classes list
            img_root_path: image dir path, if None, default to detect the image dir by the relative path of the `path`
                according to the WiderPerson data format.
            label_root_path: label dir path, if None, default to detect the label dir by the relative path of the `path`
                according to the WiderPerson data format.
            cache_at_init: if set True, will cache in memory in __init__ for faster training
            cache_on_the_fly: if set True, will cache in memory during training
            img_suffix: suffix of image file
            label_suffix: suffix of label file
            parse_fn: parse function to parse item of source iterator
            num_processes: number of processes to parse samples
        """
        self.path = path
        self.img_root_path = img_root_path
        self.label_root_path = label_root_path
        self.img_suffix = img_suffix
        self.label_suffix = label_suffix
        super(DetSourceWiderPerson, self).__init__(
            classes=classes,
            cache_at_init=cache_at_init,
            cache_on_the_fly=cache_on_the_fly,
            parse_fn=parse_fn,
            num_processes=num_processes)

    def get_source_iterator(self):
        """Build the list of (img_path, label_path) pairs from the id list file.

        Returns:
            list of tuples ``(img_path, label_path)``, one per non-empty
            line of ``self.path``.

        Raises:
            FileNotFoundError: if ``self.path`` does not exist.
        """
        # Explicit raise instead of `assert`: asserts are stripped under `-O`.
        if not os.path.exists(self.path):
            raise FileNotFoundError(f'{self.path} does not exist')

        # Default to the WiderPerson layout: `Images` and `Annotations`
        # are siblings of the id list file (e.g. data/train.txt).
        if not self.img_root_path:
            self.img_root_path = os.path.join(self.path, '..', 'Images')
        if not self.label_root_path:
            self.label_root_path = os.path.join(self.path, '..', 'Annotations')

        imgs_path_list = []
        labels_path_list = []
        with io.open(self.path, 'r') as t:
            id_lines = t.read().splitlines()
            for id_line in id_lines:
                img_id = id_line.strip()
                if img_id == '':
                    continue
                img_path = os.path.join(self.img_root_path,
                                        img_id + self.img_suffix)
                imgs_path_list.append(img_path)
                # Label files are named `<img_id>.jpg.txt`, i.e. the image
                # suffix is kept and the label suffix appended.
                label_path = os.path.join(
                    self.label_root_path,
                    img_id + self.img_suffix + self.label_suffix)
                labels_path_list.append(label_path)

        return list(zip(imgs_path_list, labels_path_list))