@inproceedings{a6795841acde43f8bc342575ba942829,
title = "GMAMflow: Learning Optical Flow through Global Multi-scale Attention Matching",
abstract = "Optical flow estimation is essential for various computer vision applications, including autonomous vehicles, object tracking, and frame interpolation. However, enhancing the accuracy of optical flow algorithms while optimizing their structural complexity continues to be a formidable challenge. This paper presents GMAMflow, a groundbreaking optical flow estimation model that leverages a global multi-scale attention mechanism. Our enhancement of the existing EMA allows the network to more effectively capture intricate details across diverse scales within complex imagery. The architectural refinements to the GMflow framework are specifically designed to elevate the learning process of optical flow. Comprehensive experimental validation using the Sintel dataset demonstrates that our approach achieves higher accuracy and outperforms competing methods. These results signify a significant stride in optical flow research, offering not only theoretical contributions but also practical implications for the advancement of technology in associated domains.",
keywords = "attention mechanism, deep learning, motion estimation, neural network, Optical flow",
author = "Jiaxuan Lin and Qiyuan Zhang and Xiaochen Yuan",
note = "Publisher Copyright: {\textcopyright} 2025 SPIE.; 16th International Conference on Signal Processing Systems, ICSPS 2024 ; Conference date: 15-11-2024 Through 17-11-2024",
year = "2025",
doi = "10.1117/12.3061529",
language = "English",
series = "Proceedings of SPIE - The International Society for Optical Engineering",
publisher = "SPIE",
editor = "Robert Minasian and Li Chai",
booktitle = "Sixteenth International Conference on Signal Processing Systems, ICSPS 2024",
address = "United States",
}