% Del Pero, Lee, Magahern, Hartley, Barnard (2011), ACM Multimedia (MM'11):
% aligning words to image regions by combining object detectors with
% appearance-based region models.
% The proceedings title is given in booktitle only; repeating it in a series
% field makes standard styles print it twice.
@inproceedings{6c7f6020b5b14eaa8d825323ca851af3,
  author    = {{Del Pero}, Luca and Lee, Philip and Magahern, James and Hartley, Emily and Barnard, Kobus},
  title     = {Fusing object detection and region appearance for image-text alignment},
  booktitle = {{MM'11} - Proceedings of the 2011 {ACM} Multimedia Conference and Co-Located Workshops},
  pages     = {1113--1116},
  year      = {2011},
  doi       = {10.1145/2072298.2071951},
  isbn      = {9781450306164},
  language  = {English (US)},
  keywords  = {Algorithms, Performance},
  abstract  = {We present a method for automatically aligning words to image regions that integrates specific object classifiers (e.g., ``car'' detectors) with weak models based on appearance features. Previous strategies have largely focused on the latter, and thus have not exploited progress on object category recognition. Hence, we augment region labeling with object detection, which simplifies the problem by reliably identifying a subset of the labels, and thereby reducing correspondence ambiguity overall. Comprehensive testing on the SAIAPR TC dataset shows that principled integration of object detection improves the region labeling task.},
  note      = {19th {ACM} International Conference on Multimedia ({ACM} Multimedia 2011, {MM'11}); conference dates: 28 November -- 1 December 2011},
}