{ "id": "1604.00187", "version": "v1", "published": "2016-04-01T10:11:38.000Z", "updated": "2016-04-01T10:11:38.000Z", "title": "PHOCNet: A Deep Convolutional Neural Network for Word Spotting in Handwritten Documents", "authors": [ "Sebastian Sudholt", "Gernot A. Fink" ], "comment": "submitted to ICFHR 2016", "categories": [ "cs.CV" ], "abstract": "In recent years, deep convolutional neural networks have achieved state of the art performance in various computer vision task such as classification, detection or segmentation. Due to their outstanding performance, CNNs are more and more used in the field of document image analysis as well. In this work, we present a CNN architecture that is trained with the recently proposed PHOC representation. We show empirically that our CNN architecture is able to outperform state of the art results for various word spotting benchmarks while exhibiting short training and test times.", "revisions": [ { "version": "v1", "updated": "2016-04-01T10:11:38.000Z" } ], "analyses": { "keywords": [ "deep convolutional neural network", "word spotting", "handwritten documents", "cnn architecture", "computer vision task" ], "note": { "typesetting": "TeX", "pages": 0, "language": "en", "license": "arXiv", "status": "editable", "adsabs": "2016arXiv160400187S" } } }