@inproceedings{0cd21439d1aa4d5d861bd5cbfedec7b2,
title = "Spatio-temporal action graph networks",
abstract = "Events defined by the interaction of objects in a scene are often of critical importance; yet important events may have insufficient labeled examples to train a conventional deep model to generalize to future object appearance. Activity recognition models that represent object interactions explicitly have the potential to learn in a more efficient manner than those that represent scenes with global descriptors. We propose a novel inter-object graph representation for activity recognition based on a disentangled graph embedding with direct observation of edge appearance. In contrast to prior efforts, our approach uses explicit appearance for high order relations derived from object-object interaction, formed over regions that are the union of the spatial extent of the constituent objects. We employ a novel factored embedding of the graph structure, disentangling a representation hierarchy formed over spatial dimensions from that found over temporal variation. We demonstrate the effectiveness of our model on the Charades activity recognition benchmark, as well as a new dataset of driving activities focusing on multi-object interactions with near-collision events. Our model offers significantly improved performance compared to baseline approaches without object-graph representations, or with previous graph-based models.",
keywords = "Activity recognition, Autonomous driving, Collisions, Graph neural network",
author = "Roei Herzig and Elad Levi and Huijuan Xu and Hang Gao and Eli Brosh and Xiaolong Wang and Amir Globerson and Trevor Darrell",
note = "Publisher Copyright: {\textcopyright} 2019 IEEE.; 17th IEEE/CVF International Conference on Computer Vision Workshop, ICCVW 2019 ; Conference date: 27-10-2019 Through 28-10-2019",
year = "2019",
month = oct,
doi = "10.1109/ICCVW.2019.00288",
language = "الإنجليزيّة",
series = "Proceedings - 2019 International Conference on Computer Vision Workshop, ICCVW 2019",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "2347--2356",
booktitle = "Proceedings - 2019 International Conference on Computer Vision Workshop, ICCVW 2019",
address = "الولايات المتّحدة",
}