Creative Commons Attribution 3.0 Unported license
We propose a new setting for testing properties of distributions while receiving samples from several distributions, but few samples per distribution. Given samples from s distributions, p_1, p_2, …, p_s, we design testers for the following problems: (1) Uniformity Testing: Testing whether all the p_i’s are uniform or ε-far from being uniform in ℓ_1-distance (2) Identity Testing: Testing whether all the p_i’s are equal to an explicitly given distribution q or ε-far from q in ℓ_1-distance, and (3) Closeness Testing: Testing whether all the p_i’s are equal to a distribution q which we have sample access to, or ε-far from q in ℓ_1-distance. By assuming an additional natural condition about the source distributions, we provide sample optimal testers for all of these problems.
@InProceedings{aliakbarpour_et_al:LIPIcs.ITCS.2020.69,
author = {Aliakbarpour, Maryam and Silwal, Sandeep},
title = {{Testing Properties of Multiple Distributions with Few Samples}},
booktitle = {11th Innovations in Theoretical Computer Science Conference (ITCS 2020)},
pages = {69:1--69:41},
series = {Leibniz International Proceedings in Informatics (LIPIcs)},
ISBN = {978-3-95977-134-4},
ISSN = {1868-8969},
year = {2020},
volume = {151},
editor = {Vidick, Thomas},
publisher = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"u}r Informatik},
address = {Dagstuhl, Germany},
URL = {https://drops.dagstuhl.de/entities/document/10.4230/LIPIcs.ITCS.2020.69},
URN = {urn:nbn:de:0030-drops-117545},
doi = {10.4230/LIPIcs.ITCS.2020.69},
annote = {Keywords: Hypothesis Testing, Property Testing, Distribution Testing, Identity Testing, Closeness Testing, Multiple Sources}
}