Prefix-Free Parsing (PFP) and its recursive variant (RPFP) provide a scalable framework for compressing and indexing large genomic datasets. By enabling efficient construction of succinct data structures, these methods support fast and memory-efficient read alignment across thousands of genomes. Their deterministic and modular design makes them especially well-suited for pangenomics and large-scale sequence analysis.
% WABI 2025 paper by Christina Boucher, LIPIcs volume 344.
% Editor accents use the brace-group form so BibTeX treats each accented
% letter as one character; the title carries no blanket brace protection,
% leaving capitalisation to the bibliography style.
@inproceedings{boucher:LIPIcs.WABI.2025.1,
  author    = {Boucher, Christina},
  title     = {Recursive Parsing and Grammar Compression in the Era of Pangenomics},
  booktitle = {25th International Conference on Algorithms for Bioinformatics (WABI 2025)},
  editor    = {Brejov{\'a}, Bro{\v{n}}a and Patro, Rob},
  pages     = {1:1--1:2},
  series    = {Leibniz International Proceedings in Informatics (LIPIcs)},
  volume    = {344},
  year      = {2025},
  publisher = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"u}r Informatik},
  address   = {Dagstuhl, Germany},
  isbn      = {978-3-95977-386-7},
  issn      = {1868-8969},
  doi       = {10.4230/LIPIcs.WABI.2025.1},
  url       = {https://drops.dagstuhl.de/entities/document/10.4230/LIPIcs.WABI.2025.1},
  urn       = {urn:nbn:de:0030-drops-239278},
  annote    = {Keywords: Prefix-Free Parsing, Recursive Prefix-Free Parsing, Grammar-Based Compression, Succinct Data Structures, RePair Compression},
}
Feedback for Dagstuhl Publishing