Source code for easycv.datasets.detection.data_sources.crowd_human

# Copyright (c) OpenMMLab. All rights reserved.

import json
import os
from multiprocessing import cpu_count

import numpy as np

from easycv.datasets.registry import DATASOURCES
from easycv.file import io
from .base import DetSourceBase


def parse_load(source_item, classes):

    img_path, lable_info = source_item

    gt_bboxes = []
    gt_labels = []
    for obj in lable_info:
        bbox = obj['box']
        box = [
            float(bbox[0]),
            float(bbox[1]),
            float(bbox[0] + bbox[2]),
            float(bbox[1] + bbox[3])
        ]
        gt_bboxes.append(box)
        if obj.get('tag') not in classes:
            continue

        gt_labels.append(int(classes.index(obj['tag'])))

    if len(gt_bboxes) == 0:
        gt_bboxes = np.zeros((0, 4), dtype=np.float32)

    img_info = {
        'gt_bboxes': np.array(gt_bboxes, dtype=np.float32),
        'gt_labels': np.array(gt_labels, dtype=np.int64),
        'filename': img_path,
    }

    return img_info


[docs]@DATASOURCES.register_module class DetSourceCrowdHuman(DetSourceBase): CLASSES = ['mask', 'person'] ''' Citation: @article{shao2018crowdhuman, title={CrowdHuman: A Benchmark for Detecting Human in a Crowd}, author={Shao, Shuai and Zhao, Zijian and Li, Boxun and Xiao, Tete and Yu, Gang and Zhang, Xiangyu and Sun, Jian}, journal={arXiv preprint arXiv:1805.00123}, year={2018} } ''' """ data dir is as follows: ``` |- data |-annotation_train.odgt |-images |-273271,1a0d6000b9e1f5b7.jpg |-... ``` Example1: data_source = DetSourceCrowdHuman( ann_file='/your/data/annotation_train.odgt', img_prefix='/your/data/images', classes=${CLASSES} ) """
[docs] def __init__(self, ann_file, img_prefix, gt_op='vbox', classes=CLASSES, cache_at_init=False, cache_on_the_fly=False, parse_fn=parse_load, num_processes=int(cpu_count() / 2), **kwargs) -> None: """ Args: ann_file (str): Path to the annotation file. img_prefix (str): Path to a directory where images are held. gt_op (str): vbox(visible box), fbox(full box), hbox(head box), defalut vbox classes(list): classes defalut=['mask', 'person'] cache_at_init: if set True, will cache in memory in __init__ for faster training cache_on_the_fly: if set True, will cache in memroy during training parse_fn: parse function to parse item of source iterator num_processes: number of processes to parse samples """ self.ann_file = ann_file self.img_prefix = img_prefix self.gt_op = gt_op super(DetSourceCrowdHuman, self).__init__( classes=classes, cache_at_init=cache_at_init, cache_on_the_fly=cache_on_the_fly, parse_fn=parse_fn, num_processes=num_processes)
[docs] def get_source_iterator(self): assert os.path.exists(self.ann_file), f'{self.ann_file} is not exists' assert os.path.exists( self.img_prefix), f'{self.img_prefix} is not exists' imgs_path_list = [] labels_list = [] with io.open(self.ann_file, 'r') as t: lines = t.readlines() for img_info in lines: img_info = json.loads(img_info.strip('\n')) img_path = os.path.join(self.img_prefix, img_info['ID'] + '.jpg') if os.path.exists(img_path): imgs_path_list.append(img_path) labels_list.append([{ 'box': label_info[self.gt_op], 'tag': label_info['tag'] } for label_info in img_info['gtboxes']]) return list(zip(imgs_path_list, labels_list))