{ "id": "1906.12039", "version": "v1", "published": "2019-06-28T04:41:06.000Z", "updated": "2019-06-28T04:41:06.000Z", "title": "Supervised Contextual Embeddings for Transfer Learning in Natural Language Processing Tasks", "authors": [ "Mihir Kale", "Aditya Siddhant", "Sreyashi Nag", "Radhika Parik", "Matthias Grabmair", "Anthony Tomasic" ], "comment": "Appeared in 2nd Learning from Limited Labeled Data (LLD) Workshop at ICLR 2019", "categories": [ "cs.CL", "cs.LG" ], "abstract": "Pre-trained word embeddings are the primary method for transfer learning in several Natural Language Processing (NLP) tasks. Recent works have focused on using unsupervised techniques such as language modeling to obtain these embeddings. In contrast, this work focuses on extracting representations from multiple pre-trained supervised models, which enriches word embeddings with task and domain specific knowledge. Experiments performed in cross-task, cross-domain and cross-lingual settings indicate that such supervised embeddings are helpful, especially in the low-resource setting, but the extent of gains is dependent on the nature of the task and domain. We make our code publicly available.", "revisions": [ { "version": "v1", "updated": "2019-06-28T04:41:06.000Z" } ], "analyses": { "keywords": [ "natural language processing tasks", "supervised contextual embeddings", "transfer learning", "enriches word embeddings", "domain specific knowledge" ], "note": { "typesetting": "TeX", "pages": 0, "language": "en", "license": "arXiv", "status": "editable" } } }