{ "id": "1804.03782", "version": "v1", "published": "2018-04-11T02:10:55.000Z", "updated": "2018-04-11T02:10:55.000Z", "title": "CoT: Cooperative Training for Generative Modeling", "authors": [ "Sidi Lu", "Lantao Yu", "Weinan Zhang", "Yong Yu" ], "categories": [ "cs.LG", "cs.AI", "cs.CL", "stat.ML" ], "abstract": "We propose Cooperative Training (CoT) for training generative models that measure a tractable density function for target data. CoT coordinately trains a generator $G$ and an auxiliary predictive mediator $M$. The training target of $M$ is to estimate a mixture density of the learned distribution $G$ and the target distribution $P$, and that of $G$ is to minimize the Jensen-Shannon divergence estimated through $M$. CoT achieves independent success without the necessity of pre-training via Maximum Likelihood Estimation or involving high-variance algorithms like REINFORCE. This low-variance algorithm is theoretically proved to be unbiased for both generative and predictive tasks. We also theoretically and empirically show the superiority of CoT over most previous algorithms, in terms of generative quality and diversity, predictive generalization ability and computational cost.", "revisions": [ { "version": "v1", "updated": "2018-04-11T02:10:55.000Z" } ], "analyses": { "keywords": [ "cooperative training", "generative modeling", "cot achieves independent success", "maximum likelihood estimation", "mixture density" ], "note": { "typesetting": "TeX", "pages": 0, "language": "en", "license": "arXiv", "status": "editable" } } }