We define a new entropy measure L(𝒮), called the containment entropy, for a set 𝒮 of sets, which considers the fact that some sets can be contained in others. We show how to represent 𝒮 within space close to L(𝒮) so that any element of any set can be retrieved in logarithmic time. We extend the result to predecessor and successor queries and show how some common set operations can be implemented efficiently.
@InProceedings{alanko_et_al:OASIcs.Grossi.6, author = {Alanko, Jarno N. and Bille, Philip and G{\o}rtz, Inge Li and Navarro, Gonzalo and Puglisi, Simon J.}, title = {{Compact Data Structures for Collections of Sets}}, booktitle = {From Strings to Graphs, and Back Again: A Festschrift for Roberto Grossi's 60th Birthday}, pages = {6:1--6:7}, series = {Open Access Series in Informatics (OASIcs)}, ISBN = {978-3-95977-391-1}, ISSN = {2190-6807}, year = {2025}, volume = {132}, editor = {Conte, Alessio and Marino, Andrea and Rosone, Giovanna and Vitter, Jeffrey Scott}, publisher = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"u}r Informatik}, address = {Dagstuhl, Germany}, URL = {https://drops.dagstuhl.de/entities/document/10.4230/OASIcs.Grossi.6}, URN = {urn:nbn:de:0030-drops-238051}, doi = {10.4230/OASIcs.Grossi.6}, annote = {Keywords: Compressed data structures, entropy of sets, data compression} }
Feedback for Dagstuhl Publishing