Short paper from the ACL 2017 proceedings (DOI 10.18653/v1/P17-2026).
Field values are kept in English/ASCII so the entry also works with classic
8-bit BibTeX. No series field is given: the proceedings title already lives
in booktitle, and repeating it in series would print the venue twice.
@inproceedings{8108536fd13047f18131cf2aaa1006f9,
  author    = {Goldberger, Jacob and Melamud, Oren},
  title     = {Information-Theory Interpretation of the Skip-Gram Negative-Sampling Objective Function},
  booktitle = {ACL 2017 - 55th Annual Meeting of the Association for Computational Linguistics, Proceedings of the Conference (Short Papers)},
  pages     = {167--171},
  publisher = {Association for Computational Linguistics (ACL)},
  address   = {United States},
  year      = {2017},
  doi       = {10.18653/v1/P17-2026},
  language  = {English},
  note      = {Publisher Copyright: {\textcopyright} 2017 Association for Computational Linguistics.; 55th Annual Meeting of the Association for Computational Linguistics, ACL 2017 ; Conference date: 30-07-2017 Through 04-08-2017},
  abstract  = {In this paper, we define a measure of dependency between two random variables, based on the Jensen-Shannon (JS) divergence between their joint distribution and the product of their marginal distributions. Then, we show that word2vec{\textquoteright}s skip-gram with negative sampling embedding algorithm finds the optimal low-dimensional approximation of this JS dependency measure between the words and their contexts. The gap between the optimal score and the low-dimensional approximation is demonstrated on a standard text corpus.},
}