@inproceedings{416728a030a54611a48c250ca9876470,
title = "Multi-modal deep clustering: Unsupervised partitioning of images",
abstract = "The clustering of unlabeled raw images is a daunting task, which has recently been approached with some success by deep learning methods. Here we propose an unsupervised clustering framework, which learns a deep neural network in an end-to-end fashion, providing direct cluster assignments of images without additional processing. Multi-Modal Deep Clustering (MMDC), trains a deep network to align its image embeddings with target points sampled from a Gaussian Mixture Model distribution. The cluster assignments are then determined by mixture component association of image embeddings. Simultaneously, the same deep network is trained to solve an additional self-supervised task of predicting image rotations. This pushes the network to learn more meaningful image representations that facilitate a better clustering. Experimental results show that MMDC achieves or exceeds state-of-the-art performance on six challenging benchmarks. On natural image datasets we improve on previous results with significant margins of up to 20\% absolute accuracy points, yielding an accuracy of 82\% on CIFAR-10, 45\% on CIFAR-100 and 69\% on STL-10.",
author = "Guy Shiran and Daphna Weinshall",
note = "Publisher Copyright: {\textcopyright} 2020 IEEE; 25th International Conference on Pattern Recognition, ICPR 2020 ; Conference date: 10-01-2021 Through 15-01-2021",
year = "2020",
doi = "10.1109/ICPR48806.2021.9411916",
language = "الإنجليزيّة",
series = "Proceedings - International Conference on Pattern Recognition",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "4728--4735",
booktitle = "Proceedings of ICPR 2020 - 25th International Conference on Pattern Recognition",
address = "الولايات المتّحدة",
}