{ "id": "1609.07916", "version": "v1", "published": "2016-09-26T10:33:13.000Z", "updated": "2016-09-26T10:33:13.000Z", "title": "Deep Structured Features for Semantic Segmentation", "authors": [ "Michael Tschannen", "Lukas Cavigelli", "Fabian Mentzer", "Thomas Wiatowski", "Luca Benini" ], "comment": "10 pages, 2 figures", "categories": [ "cs.CV", "cs.LG" ], "abstract": "We propose a highly structured neural network architecture for semantic segmentation of images that combines i) a Haar wavelet-based tree-like convolutional neural network (CNN), ii) a random layer realizing a radial basis function kernel approximation, and iii) a linear classifier. While stages i) and ii) are completely pre-specified, only the linear classifier is learned from data. Thanks to its high degree of structure, our architecture has a very small memory footprint and thus fits onto low-power embedded and mobile platforms. We apply the proposed architecture to outdoor scene and aerial image semantic segmentation and show that the accuracy of our architecture is competitive with conventional pixel classification CNNs. Furthermore, we demonstrate that the proposed architecture is data efficient in the sense of matching the accuracy of pixel classification CNNs when trained on a much smaller data set.", "revisions": [ { "version": "v1", "updated": "2016-09-26T10:33:13.000Z" } ], "analyses": { "keywords": [ "semantic segmentation", "deep structured features", "structured neural network architecture", "tree-like convolutional neural network", "wavelet-based tree-like convolutional neural" ], "note": { "typesetting": "TeX", "pages": 10, "language": "en", "license": "arXiv", "status": "editable" } } }