@inproceedings{655f844b244d4651a5acc73342efb104,
title = "Incorporating temporal context in Bag-of-Words models",
abstract = "Bag-of-Words (BoW) is a highly popular model for recognition, due to its robustness and simplicity. Its modeling capabilities, however, are somewhat limited since it discards the spatial and temporal order of the codewords. In this paper we propose a new model: Contextual Sequence of Words (CSoW) which incorporates temporal order into the BoW model for video representation. The temporal context is incorporated in three scales that capture different aspects of the variability between different performances of the same action. We show that using CSoW instead of BoW leads to a significant improvement in action recognition rates, on several different setups.",
author = "Tamar Glaser and Lihi Zelnik-Manor",
year = "2011",
doi = "10.1109/ICCVW.2011.6130436",
language = "الإنجليزيّة",
isbn = "9781467300629",
series = "Proceedings of the IEEE International Conference on Computer Vision",
pages = "1562--1569",
booktitle = "2011 IEEE International Conference on Computer Vision Workshops, ICCV Workshops 2011",
note = "2011 IEEE International Conference on Computer Vision Workshops, ICCV Workshops 2011 ; Conference date: 06-11-2011 Through 13-11-2011",
}