% Conference paper in the APSIPA ASC 2020 proceedings (auto-exported record, cleaned up).
% - The event name and dates formerly packed into `note` now live in
%   `eventtitle` / `eventdate` (read by biblatex, ignored by classic BibTeX styles).
% - The publisher copyright line is kept in the unrendered `copyright` field.
% - The former `series` field was a verbatim copy of `booktitle` and was dropped.
% - NOTE(review): `address` holds a country as exported; the publisher's city
%   is not available in this record -- confirm and replace if known.
@inproceedings{d9edd5d92675444c8daedfce0039ea0c,
  author     = {Chin, {Wen Chi} and Jhang, {Zih Jian} and Huang, {Yan Hao} and Ito, Koichi and Chen, {Hwann Tzong}},
  title      = {Learning Dense Correspondences via Local and Non-local Feature Fusion},
  booktitle  = {2020 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, {APSIPA} {ASC} 2020 - Proceedings},
  eventtitle = {2020 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, {APSIPA} {ASC} 2020},
  eventdate  = {2020-12-07/2020-12-10},
  publisher  = {Institute of Electrical and Electronics Engineers Inc.},
  address    = {United States},
  pages      = {1087--1095},
  year       = {2020},
  month      = dec,
  day        = {7},
  language   = {English},
  copyright  = {{\textcopyright} 2020 APSIPA},
  abstract   = {We present a learning-based method for extracting distinctive features on video objects. From the extracted features, we are able to derive dense correspondences between the objects in the current video frame and in the reference template. We train a deep-learning model with non-local blocks to predict dense feature maps for long-range dependencies. A new video object correspondence dataset is introduced for training and for evaluation. Further, we propose a new feature-aggregation technique that is based on the optical flow of consecutive frames and we apply it to the integration of multiple feature maps for alleviating uncertainties. We also use the local information provided by optical flow to evaluate the reliability of feature matching. The experimental results show that our local and nonlocal fusion approach can reduce unreliable correspondences and thus improve the matching accuracy.},
}