@comment{Conference paper in the AIAI 2022 proceedings (IFIP AICT series, Springer). The doi is stored bare (no LaTeX escapes) and language is given as a babel-style name.}
@inproceedings{82e65dd4d8ec474d90c402764f03d918,
  author    = {Liu, Wei and Chen, Hui and Ma, Yongqiang and Wang, Jianji and Zheng, Nanning},
  title     = {Transformer-Based Zero-Shot Detection via Contrastive Learning},
  booktitle = {Artificial Intelligence Applications and Innovations - 18th {IFIP} {WG} 12.5 International Conference, {AIAI} 2022, Proceedings},
  editor    = {Maglogiannis, Ilias and Iliadis, Lazaros and Macintyre, John and Cortez, Paulo},
  series    = {{IFIP} Advances in Information and Communication Technology},
  publisher = {Springer Science and Business Media Deutschland GmbH},
  year      = {2022},
  pages     = {316--327},
  doi       = {10.1007/978-3-031-08333-4_26},
  isbn      = {9783031083327},
  language  = {english},
  keywords  = {Contrastive learning, Transformer, Zero-Shot Detection},
  abstract  = {Zero-Shot Detection (ZSD) is a challenging computer vision problem that enables simultaneous classification and localization of previously unseen objects via auxiliary information. Most of the existing methods learn a biased visual-semantic mapping function, which prefers predicting seen classes during testing, and they only focus on region of interest and ignore contextual information in an image. To tackle these problems, we propose a novel framework for ZSD named Transformer-based Zero-Shot Detection via Contrastive Learning (TZSDC). The proposed TZSDC contains four components: transformer-based backbone, Foreground-Background (FB) separation module, Instance-Instance Contrastive Learning (IICL) module, and Knowledge-Transfer (KT) module. The transformer backbone encodes long-range contextual information with less inductive bias. The FB module separates foreground and background by scoring objectness from images. The IICL module optimizes the visual structure in embedding space to make it more discriminative and the KT module transfers knowledge from seen classes to unseen classes via category similarity. Benefiting from these modules, the accurate alignment between the contextual visual features and semantic features can be achieved. Experiments on MSCOCO well validate the effectiveness of the proposed method for ZSD and generalized ZSD.},
  note      = {Publisher Copyright: {\textcopyright} 2022, IFIP International Federation for Information Processing.; 18th IFIP WG 12.5 International Conference on Artificial Intelligence Applications and Innovations, AIAI 2022 ; Conference date: 17-06-2022 Through 20-06-2022},
}