Creative Commons Attribution 3.0 Unported license
In this paper, we consider the distributed version of Support Vector Machine (SVM) under the coordinator model, where all input data (i.e., points in R^d space) of SVM are arbitrarily distributed among k nodes in some network with a coordinator which can communicate with all nodes. We investigate two variants of this problem, with and without outliers. For distributed SVM without outliers, we prove a lower bound on the communication complexity and give a distributed (1-epsilon)-approximation algorithm to reach this lower bound, where epsilon is a user specified small constant. For distributed SVM with outliers, we present a (1-epsilon)-approximation algorithm to explicitly remove the influence of outliers. Our algorithm is based on a deterministic distributed top t selection algorithm with communication complexity of O(k log (t)) in the coordinator model. Experimental results on benchmark datasets confirm the theoretical guarantees of our algorithms.
@InProceedings{liu_et_al:LIPIcs.ISAAC.2016.54,
author = {Liu, Yangwei and Ding, Hu and Huang, Ziyun and Xu, Jinhui},
title = {{Distributed and Robust Support Vector Machine}},
booktitle = {27th International Symposium on Algorithms and Computation (ISAAC 2016)},
pages = {54:1--54:13},
series = {Leibniz International Proceedings in Informatics (LIPIcs)},
ISBN = {978-3-95977-026-2},
ISSN = {1868-8969},
year = {2016},
volume = {64},
editor = {Hong, Seok-Hee},
publisher = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"u}r Informatik},
address = {Dagstuhl, Germany},
URL = {https://drops.dagstuhl.de/entities/document/10.4230/LIPIcs.ISAAC.2016.54},
URN = {urn:nbn:de:0030-drops-68221},
doi = {10.4230/LIPIcs.ISAAC.2016.54},
annote = {Keywords: Distributed Algorithm, Communication Complexity, Robust Algorithm, SVM}
}