@comment{
  Conference paper in the proceedings volume "Pattern Recognition"
  (series: Lecture Notes in Computer Science, publisher: Springer).
  The citation key is a machine-generated identifier and is kept as-is so
  existing citations keep resolving.
  Names are stored in "Last, First" form so multi-part given names are
  parsed and abbreviated per name part.
  NOTE(review): the address field holds a country; BibTeX expects the
  publisher's city there. Confirm the city and replace the value.
  NOTE(review): no volume field is present for the series; add the series
  volume number once verified.
  NOTE(review): day is not a standard BibTeX field; presumably ignored by
  standard styles. Kept for tools that read it.
}
@inproceedings{d762735a3b704d2684b3904557003df9,
  author    = {Hu, Tongxin and Liao, Wentong and Yang, Michael Ying and Rosenhahn, Bodo},
  title     = {Exploiting attention for visual relationship detection},
  booktitle = {Pattern Recognition},
  editor    = {Fink, Gernot A. and Frintrop, Simone and Jiang, Xiaoyi},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer},
  address   = {Germany},
  pages     = {331--344},
  year      = {2019},
  month     = oct,
  day       = {25},
  doi       = {10.1007/978-3-030-33676-9_23},
  isbn      = {978-3-030-33675-2},
  language  = {English},
  keywords  = {2021 OA procedure},
  abstract  = {Visual relationship detection targets on predicting categories of predicates and object pairs, and also locating the object pairs. Recognizing the relationships between individual objects is important for describing visual scenes in static images. In this paper, we propose a novel end-to-end framework on the visual relationship detection task. First, we design a spatial attention model for specializing predicate features. Compared to a normal ROI-pooling layer, this structure significantly improves Predicate Classification performance. Second, for extracting relative spatial configuration, we propose to map simple geometric representations to a high dimension, which boosts relationship detection accuracy. Third, we implement a feature embedding model with a bi-directional RNN which considers subject, predicate and object as a time sequence. We evaluate our method on three tasks. The experiments demonstrate that our method achieves competitive results compared to state-of-the-art methods.},
  note      = {41st DAGM German Conference on Pattern Recognition (DAGM GCPR 2019), 10--13 September 2019},
}