@article{9240598d02ef4bfc9b921d82f2be6a90,
title = "Robust object recognition with cortex-like mechanisms",
abstract = "We introduce a new general framework for the recognition of complex visual scenes, which is motivated by biology: We describe a hierarchical system that closely follows the organization of visual cortex and builds an increasingly complex and invariant feature representation by alternating between a template matching and a maximum pooling operation. We demonstrate the strength of the approach on a range of recognition tasks: From invariant single object recognition in clutter to multiclass categorization problems and complex scene understanding tasks that rely on the recognition of both shape-based as well as texture-based objects. Given the biological constraints that the system had to satisfy, the approach performs surprisingly well: It has the capability of learning from only a few training examples and competes with state-of-the-art systems. We also discuss the existence of a universal, redundant dictionary of features that could handle the recognition of most object categories. In addition to its relevance for computer vision, the success of this approach suggests a plausibility proof for a class of feedforward models of object recognition in cortex.",
keywords = "Model, Neural network, Object recognition, Scene understanding, Visual cortex",
author = "Thomas Serre and Lior Wolf and Stanley Bileschi and Maximilian Riesenhuber and Tomaso Poggio",
note = "Funding Information: The authors would like to thank Sharat Chikkerur and Timothee Masquelier for useful comments on this manuscript. This report describes research done at the Center for Biological & Computational Learning, which is in the McGovern Institute for Brain Research at MIT, the Department of Brain & Cognitive Sciences, and the Computer Sciences & Artificial Intelligence Laboratory (CSAIL). This research was sponsored by grants from: the US Defense Advanced Research Projects Agency (B. Yoon), US Office of Naval Research (DARPA), US National Science Foundation-National Institutes of Health (CRCNS). Additional support was provided by: Daimler-Chrysler AG, Eastman Kodak Company, Honda Research Institute USA, Inc., Komatsu Ltd., Oxygen, Siemens Corporate Research, Inc., Sony, Sumitomo Metal Industries, Toyota Motor Corporation, and the Eugene McDermott Foundation.",
year = "2007",
month = mar,
doi = "10.1109/TPAMI.2007.56",
language = "אנגלית",
volume = "29",
pages = "411--426",
journal = "IEEE Transactions on Pattern Analysis and Machine Intelligence",
issn = "0162-8828",
publisher = "IEEE Computer Society",
number = "3",
}