{ "id": "1802.06552", "version": "v1", "published": "2018-02-19T08:58:00.000Z", "updated": "2018-02-19T08:58:00.000Z", "title": "Are Generative Classifiers More Robust to Adversarial Attacks?", "authors": [ "Yingzhen Li" ], "comment": "Submitted to ICLR 2018 workshop track, preliminary work, feedback welcome", "categories": [ "cs.LG", "stat.ML" ], "abstract": "There is a rising interest in studying the robustness of deep neural network classifiers against adversaries, with both advanced attack and defence techniques being actively developed. However, most recent work focuses on discriminative classifiers which only models the conditional distribution of the labels given the inputs. In this abstract we propose deep Bayes classifier that improves the classical naive Bayes with conditional deep generative models, and verifies its robustness against a number of existing attacks. We further developed a detection method for adversarial examples based on conditional deep generative models. Our initial results on MNIST suggest that deep Bayes classifiers might be more robust when compared with deep discriminative classifiers, and the proposed detection method achieves high detection rates against two commonly used attacks.", "revisions": [ { "version": "v1", "updated": "2018-02-19T08:58:00.000Z" } ], "analyses": { "keywords": [ "adversarial attacks", "generative classifiers", "conditional deep generative models", "deep bayes classifier", "detection method achieves high detection" ], "note": { "typesetting": "TeX", "pages": 0, "language": "en", "license": "arXiv", "status": "editable" } } }