@inproceedings{95d71a3250bc4bdeb3af784a57cdc1a4,
title = "Cost-Effective LLM Utilization for Machine Learning Tasks over Tabular Data",
abstract = "Classic machine learning (ML) models excel in modeling tabular datasets but lack broader world knowledge due to the absence of pre-training, an area where Large Language Models (LLMs) stand out. This paper presents an effective method that bridges the gap, leveraging LLMs to enrich tabular data to enhance the performance of classical ML models. Despite the previously limited success of direct LLM application to tabular tasks due to their high computational demands, our approach selectively enriches datasets with essential world knowledge, balancing performance improvement with cost-effectiveness. This work advances the capabilities of traditional ML models and opens new avenues for research at the convergence of classical ML and LLMs, marking the onset of a new era in cost-effective data enrichment.",
keywords = "Data Enrichment, Data Integration, Large Language Models",
author = "Yael Einy and Tova Milo and Slava Novgorodov",
note = "Publisher Copyright: {\textcopyright} 2024 Owner/Author.; 1st Workshop on Governance, Understanding and Integration of Data for Effective and Responsible AI, GUIDE-AI 2024 ; Conference date: 14-06-2024 Through 14-06-2024",
year = "2024",
month = jun,
day = "9",
doi = "10.1145/3665601.3669848",
language = "الإنجليزيّة",
series = "1st Workshop on Governance, Understanding and Integration of Data for Effective and Responsible AI, GUIDE-AI 2024, Co-located with SIGMOD 2024",
pages = "45--49",
booktitle = "1st Workshop on Governance, Understanding and Integration of Data for Effective and Responsible AI, GUIDE-AI 2024, Co-located with SIGMOD 2024",
}