@inproceedings{68ec99133a5f44518da925319f42206c,
title = "SLAM3R: Real-Time Dense Scene Reconstruction from Monocular RGB Videos",
abstract = "In this paper, we introduce SLAM3R, a novel and effective system for real-time, high-quality, dense 3D reconstruction using RGB videos. SLAM3R provides an end-to-end solution by seamlessly integrating local 3D reconstruction and global coordinate registration through feed-forward neural networks. Given an input video, the system first converts it into overlapping clips using a sliding window mechanism. Unlike traditional pose optimization-based methods, SLAM3R directly regresses 3D pointmaps from RGB images in each window and progressively aligns and deforms these local pointmaps to create a globally consistent scene reconstruction-all without explicitly solving any camera parameters. Experiments across datasets consistently show that SLAM3R achieves state-of-the-art reconstruction accuracy and completeness while maintaining real-time performance at 20+ FPS. Code available at: https://github.com/PKU-VCL-3DV/SLAM3R.",
keywords = "relative camera pose regression, visual localization",
author = "Yuzheng Liu and Siyan Dong and Shuzhe Wang and Yingda Yin and Yanchao Yang and Qingnan Fan and Baoquan Chen",
note = "Publisher Copyright: {\textcopyright} 2025 IEEE.; IEEE Conference on Computer Vision and Pattern Recognition, CVPR ; Conference date: 10-06-2025 Through 17-06-2025",
year = "2025",
doi = "10.1109/CVPR52734.2025.01552",
language = "English",
isbn = "979-8-3315-4365-5",
series = "IEEE Computer Society Conference on Computer Vision and Pattern Recognition",
publisher = "IEEE",
booktitle = "2025 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)",
address = "United States",
}