Publications

CVPR 2026
SceneVerse++ teaser

Lifting Unlabeled Internet-level Data for 3D Scene Understanding

Yixin Chen, Yaowei Zhang, Huangyue Yu, Junchao He, Yan Wang, Jiangyong Huang, Hongyu Shen, Junfeng Ni, Shaofei Wang, Baoxiong Jia, Song-Chun Zhu, Siyuan Huang

BibTeX
@inproceedings{chen2026lifting,
  title     = {Lifting Unlabeled Internet-level Data for {3D} Scene Understanding},
  author    = {Chen, Yixin and Zhang, Yaowei and Yu, Huangyue and He, Junchao and Wang, Yan and Huang, Jiangyong and Shen, Hongyu and Ni, Junfeng and Wang, Shaofei and Jia, Baoxiong and Zhu, Song-Chun and Huang, Siyuan},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  year      = {2026}
}
CVPR 2025
MPEC teaser

Masked Point-Entity Contrast for Open-Vocabulary 3D Scene Understanding

Yan Wang*, Baoxiong Jia*, Ziyu Zhu, Siyuan Huang

BibTeX
@inproceedings{wang2025masked,
  title     = {Masked Point-Entity Contrast for Open-Vocabulary {3D} Scene Understanding},
  author    = {Wang, Yan and Jia, Baoxiong and Zhu, Ziyu and Huang, Siyuan},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  year      = {2025}
}
CVPR 2025
Beacon3D teaser

Unveiling the Mist over 3D Vision-Language Understanding: Object-centric Evaluation with Chain-of-Analysis

Jiangyong Huang*, Baoxiong Jia*, Yan Wang, Ziyu Zhu, Xiongkun Linghu, Qing Li, Song-Chun Zhu, Siyuan Huang

BibTeX
@inproceedings{huang2025unveiling,
  title     = {Unveiling the Mist over {3D} Vision-Language Understanding: Object-centric Evaluation with Chain-of-Analysis},
  author    = {Huang, Jiangyong and Jia, Baoxiong and Wang, Yan and Zhu, Ziyu and Linghu, Xiongkun and Li, Qing and Zhu, Song-Chun and Huang, Siyuan},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  year      = {2025}
}
ECCV 2024
SceneVerse teaser

SceneVerse: Scaling 3D Vision-Language Learning for Grounded Scene Understanding

Baoxiong Jia*, Yixin Chen*, Huangyue Yu, Yan Wang, Xuesong Niu, Tengyu Liu, Qing Li, Siyuan Huang

BibTeX
@inproceedings{jia2024sceneverse,
  title     = {{SceneVerse}: Scaling {3D} Vision-Language Learning for Grounded Scene Understanding},
  author    = {Jia, Baoxiong and Chen, Yixin and Yu, Huangyue and Wang, Yan and Niu, Xuesong and Liu, Tengyu and Li, Qing and Huang, Siyuan},
  booktitle = {European Conference on Computer Vision ({ECCV})},
  year      = {2024}
}
ICML 2024
LEO teaser

An Embodied Generalist Agent in 3D World

Jiangyong Huang*, Silong Yong*, Xiaojian Ma*, Xiongkun Linghu*, Puhao Li, Yan Wang, Qing Li, Song-Chun Zhu, Baoxiong Jia, Siyuan Huang

BibTeX
@inproceedings{huang2024embodied,
  title     = {An Embodied Generalist Agent in {3D} World},
  author    = {Huang, Jiangyong and Yong, Silong and Ma, Xiaojian and Linghu, Xiongkun and Li, Puhao and Wang, Yan and Li, Qing and Zhu, Song-Chun and Jia, Baoxiong and Huang, Siyuan},
  booktitle = {Proceedings of the International Conference on Machine Learning ({ICML})},
  year      = {2024}
}
AAAI 2023
SSDA3D teaser

SSDA3D: Semi-supervised Domain Adaptation for 3D Object Detection from Point Cloud

Yan Wang*, Junbo Yin*, Wei Li, Pascal Frossard, Ruigang Yang, Jianbing Shen

BibTeX
@inproceedings{wang2023ssda3d,
  title     = {{SSDA3D}: Semi-supervised Domain Adaptation for {3D} Object Detection from Point Cloud},
  author    = {Wang, Yan and Yin, Junbo and Li, Wei and Frossard, Pascal and Yang, Ruigang and Shen, Jianbing},
  booktitle = {Proceedings of the {AAAI} Conference on Artificial Intelligence},
  year      = {2023}
}

* denotes equal contribution.