Creative Commons Attribution 4.0 International license
We study the problem of finding a fair linear scoring function over (numerical) attributes for top-k selection, ensuring fairness through a proportional representation constraint on the protected group. Existing algorithms do not scale efficiently, particularly in higher dimensions. Our hardness analysis shows that in more than two dimensions, no algorithm is likely to scale efficiently with respect to dataset size, and the computational complexity is likely to grow rapidly with dimensionality. However, the hardness results also provide key insights guiding algorithm design, leading to our two-pronged solution: (1) For small k, our analysis reveals a gap in the hardness barrier. By addressing various engineering challenges, including achieving efficient parallelism, we turn this potential of efficiency into an optimized geometry-based algorithm delivering substantial performance gains. (2) For large k, where the hardness is robust, we employ a practically efficient optimization-based algorithm which, despite being theoretically worse, achieves superior real-world performance. Experimental evaluations on real-world datasets then explore scenarios where worst-case behavior does not manifest, identifying areas critical to practical performance. Our solution achieves speedups of up to several orders of magnitude compared to the state of the art, an efficiency made possible through a tight integration of hardness analysis, algorithm design, practical engineering, and empirical evaluation.
@InProceedings{cai:LIPIcs.SoCG.2026.26,
author = {Cai, Guangya},
title = {{Finding a Fair Scoring Function for Top-k Selection: From Hardness to Practice}},
booktitle = {42nd International Symposium on Computational Geometry (SoCG 2026)},
pages = {26:1--26:17},
series = {Leibniz International Proceedings in Informatics (LIPIcs)},
ISBN = {978-3-95977-418-5},
ISSN = {1868-8969},
year = {2026},
volume = {367},
editor = {Ahn, Hee-Kap and Hoffmann, Michael and Nayyeri, Amir},
publisher = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"u}r Informatik},
address = {Dagstuhl, Germany},
URL = {https://drops.dagstuhl.de/entities/document/10.4230/LIPIcs.SoCG.2026.26},
URN = {urn:nbn:de:0030-drops-258320},
doi = {10.4230/LIPIcs.SoCG.2026.26},
annote = {Keywords: Fairness, Top-k, Integration}
}
archived version