% STOP dataset paper, published in the IEEE SLT 2022 workshop proceedings.
% - `doi` stores the bare identifier; citation styles add the resolver URL themselves.
% - `{STOP}` is braced in the title so sentence-casing styles keep the acronym upper-case.
% - No `series` field: the export duplicated `booktitle` there, which printed the
%   proceedings title twice under standard styles.
% - NOTE(review): `address` is the publisher's country as exported; replace with the
%   publisher's city if your style expects one.
@inproceedings{ed80ae614f5142e6946cfb6387aa34cd,
title = "{STOP}: A Dataset for Spoken Task Oriented Semantic Parsing",
abstract = "End-to-end spoken language understanding (SLU) predicts intent directly from audio using a single model. It promises to improve the performance of assistant systems by leveraging acoustic information lost in the intermediate textual representation and preventing cascading errors from Automatic Speech Recognition (ASR). Further, having one unified model has efficiency advantages when deploying assistant systems on-device. However, the limited number of public audio datasets with semantic parse labels hinders the research progress in this area. In this paper, we release the Spoken Task-Oriented semantic Parsing (STOP) dataset, the largest and most complex SLU dataset publicly available. Additionally, we define low-resource splits to establish a benchmark for improving SLU when limited labeled data is available. Furthermore, in addition to the human-recorded audio, we are releasing a TTS-generated version to benchmark the performance for low-resource and domain adaptation of end-to-end SLU systems.",
keywords = "assistant, domain adaptation, spoken language understanding",
author = "Tomasello, Paden and Shrivastava, Akshat and Lazar, Daniel and Hsu, {Po Chun} and Le, Duc and Sagar, Adithya and Elkahky, Ali and Copet, Jade and Hsu, {Wei Ning} and Adi, Yossi and Algayres, Robin and Nguyen, {Tu Ahn} and Dupoux, Emmanuel and Zettlemoyer, Luke and Mohamed, Abdelrahman",
note = "Publisher Copyright: {\textcopyright} 2023 IEEE.; 2022 IEEE Spoken Language Technology Workshop, SLT 2022 ; Conference date: 09-01-2023 Through 12-01-2023",
year = "2023",
doi = "10.1109/SLT54892.2023.10022703",
language = "English",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "991--998",
booktitle = "2022 IEEE Spoken Language Technology Workshop, SLT 2022 - Proceedings",
address = "United States",
}