@inproceedings{2ba9f9b23f1f4f7c83be9d1eba8256f9,
title = "Understanding Global Structure Relation via Reversible Visual State Space Model for Robust Cross-View Geo-Localization",
abstract = "Cross-view geo-localization aims to match images captured from different views over the same geographic region. Existing methods typically determine spatial correlations between cross-view images according to the similarity of representations extracted from salient areas. However, such local appearance representations fail to capture the underlying structural relationships among the corresponding regions, which severely undermines the reliability of localization results in complex scenes. To address this problem, we propose a reversible visual state-space model to enhance the understanding of global structural relations inherent in images captured from different views. Specifically, we design a progressive spatial analysis approach, which incrementally integrates geometric dependencies exploited at different levels to improve the understanding of the global structure. Moreover, we introduce a reversible rotational scanning mechanism based on the 2D-selective-scan (SS2D) module to facilitate the exploitation of geometric dependencies between cross-view images. Finally, we adopt the cross-dimension interaction strategy to enrich the informativeness of representations in the common space, thereby reinforcing the discriminability of cross-view representations between different regions. Extensive experiments on the University-1652 and University160k-WX datasets demonstrate that the proposed method achieves state-of-the-art performance while maintaining robustness under complex environmental conditions.",
keywords = "Cross-view Geo-localization, Structure Relation, State Space Model",
author = "Peiyuan Ma and Yimin Fu and Jialin Lyu and Zhunga Liu",
note = "This work was supported by the National Natural Science Foundation of China under Grant 62425308 and Grant U24B20178. Publisher copyright: {\textcopyright} 2025 Copyright held by the owner/author(s).",
year = "2025",
month = oct,
day = "31",
doi = "10.1145/3728482.3757390",
language = "English",
series = "MM: International Multimedia Conference",
publisher = "Association for Computing Machinery (ACM)",
pages = "42–46",
booktitle = "UAVM 2025 - Proceedings of the 3rd International Workshop on UAVs in Multimedia",
address = "United States",
}