@inproceedings{b7aa23ebaef04840903a85b1b4e7d02d,
title = "NOPE: Novel Object Pose Estimation from a Single Image",
abstract = "The practicality of 3D object pose estimation remains limited for many applications due to the need for prior knowledge of a 3D model and a training period for new objects. To address this limitation, we propose an approach that takes a single image of a new object as input and pre-dicts the relative pose of this object in new images without prior knowledge of the object's 3D model and without re-quiring training time for new objects and categories. We achieve this by training a model to directly predict discrim-inative embeddings for viewpoints surrounding the object. This prediction is done using a simple U-Net architecture with attention and conditioned on the desired pose, which yields extremely fast inference. We compare our approach to state-of-the-art methods and show it outperforms them both in terms of accuracy and robustness.",
keywords = "object pose estimation",
author = "Nguyen, \{Van Nguyen\} and Thibault Groueix and Georgy Ponimatkin and Yinlin Hu and Renaud Marlet and Mathieu Salzmann and Vincent Lepetit",
note = "Publisher Copyright: {\textcopyright} 2024 IEEE.; 2024 IEEE/CVF Conference on Computer Vision and Pattern Recognition, CVPR 2024 ; Conference date: 16-06-2024 Through 22-06-2024",
year = "2024",
month = jan,
day = "1",
doi = "10.1109/CVPR52733.2024.01697",
language = "English",
isbn = "9798350353006",
series = "Proceedings of the IEEE Computer Society Conference on Computer Vision and Pattern Recognition",
publisher = "IEEE Computer Society",
pages = "17923--17932",
booktitle = "Proceedings - 2024 IEEE/CVF Conference on Computer Vision and Pattern Recognition, CVPR 2024",
}