@inproceedings{c89b61286c1549259f5d8b359213cfa1,
title = "A Simple and Efficient Approach for Adaptive Entropy Coding over Large Alphabets",
abstract = "Encoding a sequence of independent symbols over a large alphabet size is a challenging problem with applications in many fields. The most widely used adaptive entropy coding techniques (namely, arithmetic and Huffman coding) are known to achieve an average codeword length which may be significantly greater than the empirical entropy of the sequence, as the alphabet size increases. In this work we introduce an efficient and easy-to-implement method for large alphabet adaptive encoding. We propose a conceptual framework in which a sequence of symbols, over a large alphabet size, is decomposed into multiple 'almost independent' sequences over a smaller alphabet. Then each of these sequences is encoded separately. This way, we allow encoding of small alphabet sequences, at the cost of the 'remaining dependence' among the sequences. We demonstrate the advantages of our suggested scheme through a series of theorems and experiments, showing it reduces both the average codeword length and the compression runtime in many large alphabet setups.",
keywords = "Factorial codes, Independent Component Analysis, Large alphabet source coding",
author = "Amichai Painsky and Saharon Rosset and Meir Feder",
note = "Publisher Copyright: {\textcopyright} 2016 IEEE.; 2016 Data Compression Conference, DCC 2016 ; Conference date: 29-03-2016 Through 01-04-2016",
year = "2016",
month = dec,
day = "15",
doi = "10.1109/DCC.2016.59",
language = "الإنجليزيّة",
series = "Data Compression Conference Proceedings",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "369--378",
editor = "Marcellin, {Michael W.} and Ali Bilgin and Joan Serra-Sagrista and Storer, {James A.}",
booktitle = "Proceedings - DCC 2016",
address = "الولايات المتّحدة",
}