% Conference paper: "Aligning Alignments" (Karidi, Grossman, Abend), CoNLL 2024 proceedings.
% Review notes on this record:
%   - The citation key is kept exactly as exported so existing \cite commands keep resolving.
%   - language/address were exported in an Arabic locale; they are stored here as the
%     English equivalents so the record is ASCII-only and consistent with its other fields.
%   - address holds a country name, as exported; the publisher's city is not visible in
%     this record -- TODO confirm and replace if a city is wanted.
%   - The exported series field was a verbatim copy of booktitle and has been dropped so
%     styles that print series do not repeat the proceedings title.
%   - note is kept verbatim from the export (copyright line plus conference dates).
@inproceedings{4188352ca8f04144aa2ed87a1aff80b4,
  author    = {Karidi, Taelin and Grossman, Eitan and Abend, Omri},
  title     = {Aligning Alignments: Do Colexification and Distributional Similarity Align as Measures of cross-lingual Lexical Alignment?},
  booktitle = {{CoNLL} 2024 - 28th Conference on Computational Natural Language Learning, Proceedings of the Conference},
  editor    = {Barak, Libby and Alikhani, Malihe},
  publisher = {Association for Computational Linguistics (ACL)},
  address   = {United States},
  pages     = {327--341},
  year      = {2024},
  language  = {English},
  note      = {Publisher Copyright: {\textcopyright} 2024 Association for Computational Linguistics.; 28th Conference on Computational Natural Language Learning, CoNLL 2024 ; Conference date: 15-11-2024 Through 16-11-2024},
  abstract  = {The data-driven investigation of the extent to which lexicons of different languages align has mostly fallen into one of two categories: colexification-based and distributional. The two approaches are grounded in distinct methodologies, operate on different assumptions, and are used in diverse ways. This raises two important questions: (a) are there settings in which the predictions of the two approaches can be directly compared? and if so, (b) what is the extent of the similarity and what are its determinants? We offer novel operationalizations for the two approaches in a manner that allows for their direct comparison, and conduct a comprehensive analysis on a diverse set of 16 languages. Our analysis is carried out at different levels of granularity. At the word-level, the two methods present different results across the board. However, intriguingly, at the level of semantic domains (e.g., kinship, quantity), the two methods show considerable convergence in their predictions. Our findings also indicate that the distributional methods likely capture a more fine-grained alignment than their counterpart colexification-based methods, and may thus be more suited for settings where fewer languages are evaluated.},
}