Safemotion Lib
data_sampler.py
# encoding: utf-8
"""
@author:  l1aoxingyu
@contact: sherlockliao01@gmail.com
"""
import itertools
from typing import Optional

import numpy as np
from torch.utils.data import Sampler

from fastreid.utils import comm


class TrainingSampler(Sampler):
    """
    In training, we only care about the "infinite stream" of training data.
    So this sampler produces an infinite stream of indices, and
    all workers cooperate to correctly shuffle the indices and sample different indices.
    The sampler in each worker effectively produces `indices[worker_id::num_workers]`,
    where `indices` is an infinite stream of indices consisting of
    `shuffle(range(size)) + shuffle(range(size)) + ...` (if shuffle is True)
    or `range(size) + range(size) + ...` (if shuffle is False).
    """

    def __init__(self, size: int, shuffle: bool = True, seed: Optional[int] = None):
        """
        Args:
            size (int): the total number of samples in the underlying dataset
            shuffle (bool): whether to shuffle the indices or not
            seed (int): the initial seed of the shuffle. Must be the same
                across all workers. If None, a random seed shared among all
                workers will be used (this requires synchronization among them).
        """
        self._size = size
        assert size > 0
        self._shuffle = shuffle
        if seed is None:
            seed = comm.shared_random_seed()
        self._seed = int(seed)

        self._rank = comm.get_rank()
        self._world_size = comm.get_world_size()

    def __iter__(self):
        # Each worker takes every `world_size`-th index, offset by its rank,
        # so the workers jointly cover the full stream without overlap.
        start = self._rank
        yield from itertools.islice(self._infinite_indices(), start, None, self._world_size)

    def _infinite_indices(self):
        # Seed identically on every worker so all ranks generate the same
        # stream; the rank-based slicing in __iter__ then stays consistent.
        np.random.seed(self._seed)
        while True:
            if self._shuffle:
                yield from np.random.permutation(self._size)
            else:
                yield from np.arange(self._size)


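# A minimal usage sketch (not part of the original module): it shows how
# TrainingSampler typically feeds a PyTorch DataLoader. The `dataset` and
# `max_iter` names below are hypothetical stand-ins for illustration only.
def _example_training_loop(dataset, max_iter: int = 1000):
    from torch.utils.data import DataLoader

    # The sampler yields an infinite index stream, so the loop itself
    # must bound the number of iterations.
    sampler = TrainingSampler(size=len(dataset), shuffle=True, seed=42)
    loader = DataLoader(dataset, sampler=sampler, batch_size=64)
    for _, batch in zip(range(max_iter), loader):
        pass  # one training step per batch

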
class InferenceSampler(Sampler):
    """
    Produce indices for inference.
    Inference needs to run on the __exact__ set of samples;
    therefore, when the total number of samples is not divisible by the
    number of workers, this sampler produces a different number of samples
    on different workers.
    """

    def __init__(self, size: int):
        """
        Args:
            size (int): the total number of samples in the underlying dataset
        """
        self._size = size
        assert size > 0
        self._rank = comm.get_rank()
        self._world_size = comm.get_world_size()

        # Ceiling division: every rank gets at most `shard_size` indices,
        # and the last rank's shard may be smaller (or empty).
        shard_size = (self._size - 1) // self._world_size + 1
        begin = shard_size * self._rank
        end = min(shard_size * (self._rank + 1), self._size)
        self._local_indices = range(begin, end)

    def __iter__(self):
        yield from self._local_indices

    def __len__(self):
        return len(self._local_indices)
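

# A worked sketch (not part of the original module) of the shard arithmetic
# above. With size=10 and world_size=4, shard_size = ceil(10/4) = 3, so the
# ranks receive the ranges [0, 3), [3, 6), [6, 9), and [9, 10): the last
# shard is smaller, but every sample is covered exactly once.
def _example_inference_shards(size: int = 10, world_size: int = 4):
    shards = []
    for rank in range(world_size):
        shard_size = (size - 1) // world_size + 1  # ceiling division
        begin = shard_size * rank
        end = min(shard_size * (rank + 1), size)
        shards.append(list(range(begin, end)))
    return shards  # [[0, 1, 2], [3, 4, 5], [6, 7, 8], [9]]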