% Workshop paper by Kadar and Ben-Shahar in the ECCV 2014 Workshops
% proceedings (Lecture Notes in Computer Science series, Springer).
% Conventions used in this entry:
%   - names are stored as "Last, First" so parsing does not depend on case;
%   - braces protect the coined name SceneNet and the acronym ECCV from
%     style-driven recasing;
%   - quotation marks in the abstract use LaTeX ``...'' rather than Unicode
%     curly quotes, matching the escaped copyright sign in the note field.
% NOTE(review): address holds a country, not the publisher's city, and the
% series volume number is absent -- confirm both against the publisher record.
@inproceedings{d2fab6b87d5c457e9fc21c2fae3b37bd,
  author    = {Kadar, Ilan and Ben-Shahar, Ohad},
  title     = {{SceneNet}: A perceptual ontology for scene understanding},
  booktitle = {Computer Vision -- {ECCV} 2014 Workshops, Proceedings},
  editor    = {Rother, Carsten and Bronstein, Michael M. and Agapito, Lourdes},
  series    = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  publisher = {Springer Verlag},
  address   = {Germany},
  pages     = {385--400},
  year      = {2015},
  month     = jan,
  day       = {1},
  doi       = {10.1007/978-3-319-16181-5_27},
  language  = {English},
  keywords  = {Perceptual relations, Perceptual space, Scene categories, Scene gist recognition, Scene understanding},
  abstract  = {Scene recognition systems which attempt to deal with a large number of scene categories currently lack proper knowledge about the perceptual ontology of scene categories and would enjoy significant advantage from a perceptually meaningful scene representation. In this work we perform a large-scale human study to create ``SceneNet'', an online ontology database for scene understanding that organizes scene categories according to their perceptual relationships. This perceptual ontology suggests that perceptual relationships do not always conform the semantic structure between categories, and it entails a lower dimensional perceptual space with ``perceptually meaningful'' Euclidean distance, where each embedded category is represented by a single prototype. Using the SceneNet ontology and database we derive a computational scheme for learning non-linear mapping of scene images into the perceptual space, where each scene image is closest to its category prototype than to any other prototype by a large margin. Then, we demonstrate how this approach facilitates improvements in large-scale scene categorization over state-of-the-art methods and existing semantic ontologies, and how it reveals novel perceptual findings about the discriminative power of visual attributes and the typicality of scenes.},
  note      = {Publisher Copyright: {\textcopyright} Springer International Publishing Switzerland 2015.; 13th European Conference on Computer Vision, ECCV 2014 ; Conference date: 06-09-2014 Through 12-09-2014},
}