{ "id": "2006.03875", "version": "v1", "published": "2020-06-06T14:20:25.000Z", "updated": "2020-06-06T14:20:25.000Z", "title": "Coresets via Bilevel Optimization for Continual Learning and Streaming", "authors": [ "Zalán Borsos", "Mojmír Mutný", "Andreas Krause" ], "categories": [ "cs.LG", "stat.ML" ], "abstract": "Coresets are small data summaries that are sufficient for model training. They can be maintained online, enabling efficient handling of large data streams under resource constraints. However, existing constructions are limited to simple models such as k-means and logistic regression. In this work, we propose a novel coreset construction via cardinality-constrained bilevel optimization. We show how our framework can efficiently generate coresets for deep neural networks, and demonstrate its empirical benefits in continual learning and in streaming settings.", "revisions": [ { "version": "v1", "updated": "2020-06-06T14:20:25.000Z" } ], "analyses": { "keywords": [ "continual learning", "deep neural networks", "large data streams", "novel coreset construction", "small data summaries" ], "note": { "typesetting": "TeX", "pages": 0, "language": "en", "license": "arXiv", "status": "editable" } } }