@inproceedings{f97e68b76d2547948ac0332ea4fef322,
title = "Making computers look the way we look: Exploiting visual attention for image understanding",
abstract = "Human Visual attention (HVA) is an important strategy to focus on specific information while observing and understanding visual stimuli. HVA involves making a series of fixations on select locations while performing tasks such as object recognition, scene understanding, etc. We present one of the first works that combines fixation information with automated concept detectors to (i) infer abstract image semantics, and (ii) enhance performance of object detectors. We develop visual attention-based models that sample fixation distributions and fixation transition distributions in regions-of-interest (ROI) to infer abstract semantics such as expressive faces and interactions (such as look, read, etc.). We also exploit eye-gaze information to deduce possible locations and scale of salient concepts and aid state-of-art detectors. A 18% performance increase with over 80% reduction in computational time for a state-of-art object detector [4].",
keywords = "abstract, eye-tracker, fixations, salient regions, visual attention",
author = "Harish Katti and Ramanathan Subramanian and Mohan Kankanhalli and Nicu Sebe and Chua, {Tat Seng} and Ramakrishnan, {Kalpathi R.}",
year = "2010",
doi = "10.1145/1873951.1874047",
language = "English",
isbn = "9781605589336",
series = "MM'10 - Proceedings of the ACM Multimedia 2010 International Conference",
publisher = "Association for Computing Machinery (ACM)",
pages = "667--670",
editor = "{del Bimbo}, {Alberto } and Shih-Fu Chang and Arnold Smeulders",
booktitle = "MM'10 - Proceedings of the ACM Multimedia 2010 International Conference",
address = "United States",
}