% Conference paper (SIGGRAPH 2023 Conference Papers) presenting the Perfusion method.
% The doi field stores the bare DOI; bibliography styles add the resolver prefix themselves.
% No series field is given: the exported value merely repeated booktitle verbatim.
@inproceedings{cf46e3aa0c4f4c4683f309b74851743b,
author = "Tewel, Yoad and Gal, Rinon and Chechik, Gal and Atzmon, Yuval",
title = "Key-Locked Rank One Editing for Text-to-Image Personalization",
booktitle = "Proceedings - SIGGRAPH 2023 Conference Papers",
editor = "Spencer, Stephen N.",
year = "2023",
month = jul,
day = "23",
doi = "10.1145/3588432.3591506",
language = "English",
keywords = "Diffusion, Personalization, Rank-One, Text-to-Image",
abstract = "Text-to-image models (T2I) offer a new level of flexibility by allowing users to guide the creative process through natural language. However, personalizing these models to align with user-provided visual concepts remains a challenging problem. The task of T2I personalization poses multiple hard challenges, such as maintaining high visual fidelity while allowing creative control, combining multiple personalized concepts in a single image, and keeping a small model size. We present Perfusion, a T2I personalization method that addresses these challenges using dynamic rank-1 updates to the underlying T2I model. Perfusion avoids overfitting by introducing a new mechanism that {"}locks{"} new concepts' cross-attention Keys to their superordinate category. Additionally, we develop a gated rank-1 approach that enables us to control the influence of a learned concept during inference time and to combine multiple concepts. This allows runtime efficient balancing of visual-fidelity and textual-alignment with a single 100KB trained model. Importantly, it can span different operating points across the Pareto front without additional training. We compare our approach to strong baselines and demonstrate its qualitative and quantitative strengths.",
note = "Publisher Copyright: {\textcopyright} 2023 ACM.; 2023 Special Interest Group on Computer Graphics and Interactive Techniques Conference, SIGGRAPH 2023 ; Conference date: 06-08-2023 Through 10-08-2023",
}