@inproceedings{8ca8ae9eefcd43ccbe0937cb237c08e6,
title = "Self-normalization properties of language modeling",
abstract = "Self-normalizing discriminative models approximate the normalized probability of a class without having to compute the partition function. In the context of language modeling, this property is particularly appealing as it may significantly reduce run-times due to large word vocabularies. In this study, we provide a comprehensive investigation of language modeling self-normalization. First, we theoretically analyze the inherent self-normalization properties of Noise Contrastive Estimation (NCE) language models. Then, we compare them empirically to softmax-based approaches, which are self-normalized using explicit regularization, and suggest a hybrid model with compelling properties. Finally, we uncover a surprising negative correlation between self-normalization and perplexity across the board, as well as some regularity in the observed errors, which may potentially be used for improving self-normalization algorithms in the future.",
author = "Jacob Goldberger and Oren Melamud",
note = "Publisher Copyright: {\textcopyright} 2018 COLING 2018 - 27th International Conference on Computational Linguistics, Proceedings. All rights reserved.; 27th International Conference on Computational Linguistics, COLING 2018 ; Conference date: 20-08-2018 Through 26-08-2018",
year = "2018",
language = "الإنجليزيّة",
series = "COLING 2018 - 27th International Conference on Computational Linguistics, Proceedings",
publisher = "Association for Computational Linguistics (ACL)",
pages = "764--773",
editor = "Bender, \{Emily M.\} and Leon Derczynski and Pierre Isabelle",
booktitle = "COLING 2018 - 27th International Conference on Computational Linguistics, Proceedings",
address = "الولايات المتّحدة",
}