mmselfsup/openselfsup/datasets/deepcluster.py

35 lines
1.1 KiB
Python
Raw Normal View History

2020-06-24 13:59:02 +08:00
from PIL import Image
2020-06-16 00:05:18 +08:00
from .registry import DATASETS
from .base import BaseDataset
@DATASETS.register_module
class DeepClusterDataset(BaseDataset):
"""Dataset for DC and ODC.
"""
def __init__(self, data_source, pipeline):
super(DeepClusterDataset, self).__init__(data_source, pipeline)
# init clustering labels
self.labels = [-1 for _ in range(self.data_source.get_length())]
def __getitem__(self, idx):
2020-06-17 01:31:59 +08:00
img = self.data_source.get_sample(idx)
assert isinstance(img, Image.Image), \
'The output from the data source must be an Image, got: {}. \
Please ensure that the list file does not contain labels.'.format(
type(img))
2020-06-16 00:05:18 +08:00
label = self.labels[idx]
img = self.pipeline(img)
return dict(img=img, pseudo_label=label, idx=idx)
def assign_labels(self, labels):
assert len(self.labels) == len(labels), \
"Inconsistent lenght of asigned labels, \
{} vs {}".format(len(self.labels), len(labels))
self.labels = labels[:]
def evaluate(self, scores, keyword, logger=None):
raise NotImplemented