Publications

The archive.

Peer-reviewed publications and preprints from the lab and our collaborators. Reference implementations are released on GitHub when review and clinical-data licensing allow.

2024 WACV
A Survey on Multimodal Large Language Models for Autonomous Driving (opens in new tab)
Cui C, Ma Y, Cao X, Ye W, …, Cao J, Wang Z, Zheng C.
Cite
@inproceedings{cui2024survey,
  author    = {Cui, C. and Ma, Y. and Cao, X. and Ye, W. and others},
  title     = {A Survey on Multimodal Large Language Models for Autonomous Driving},
  booktitle = {IEEE/CVF Winter Conference on Applications of Computer Vision (WACV) Workshop},
  year      = {2024},
  url       = {https://arxiv.org/abs/2311.12320},
}
2024 WACV
Drive as You Speak: Enabling Human-Like Interaction with Large Language Models in Autonomous Vehicles (opens in new tab)
Cui C, Ma Y, Cao X, Ye W, Wang Z.
Cite
@inproceedings{cui2024drive,
  author    = {Cui, C. and Ma, Y. and Cao, X. and Ye, W. and Wang, Z.},
  title     = {Drive as You Speak: Enabling Human-Like Interaction with Large Language Models in Autonomous Vehicles},
  booktitle = {IEEE/CVF Winter Conference on Applications of Computer Vision (WACV) Workshop},
  year      = {2024},
  url       = {https://arxiv.org/abs/2309.10228},
}
2024 WACV
MACP: Efficient Model Adaptation for Cooperative Perception (opens in new tab)
Ma Y, Lu J, Cui C, Zhao S, Cao X, Ye W, Wang Z.
Cite
@inproceedings{ma2024macp,
  author    = {Ma, Y. and Lu, J. and Cui, C. and Zhao, S. and Cao, X. and Ye, W. and Wang, Z.},
  title     = {{MACP}: Efficient Model Adaptation for Cooperative Perception},
  booktitle = {IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  year      = {2024},
  url       = {https://arxiv.org/abs/2310.16870v2},
}
2023 ICASSP
ViTASD: Robust Vision Transformer Baselines for Autism Spectrum Disorder Facial Diagnosis (opens in new tab)
Cao X, Ye W, Sizikova E, Bai X, Coffee M, Zeng H, Cao J.
Code
Cite
@inproceedings{cao2023vitasd,
  author    = {Cao, X. and Ye, W. and Sizikova, E. and Bai, X. and Coffee, M. and Zeng, H. and Cao, J.},
  title     = {{ViTASD}: Robust Vision Transformer Baselines for Autism Spectrum Disorder Facial Diagnosis},
  booktitle = {IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  year      = {2023},
  url       = {https://ieeexplore.ieee.org/document/10094684},
}
2022 IJCAI
AggPose: Deep Aggregation Vision Transformer for Infant Pose Estimation (opens in new tab)
Cao X, Li X, Ma L, Huang Y, Feng X, Chen Z, Zeng H, Cao J.
Code
Cite
@inproceedings{cao2022aggpose,
  author    = {Cao, X. and Li, X. and Ma, L. and Huang, Y. and Feng, X. and Chen, Z. and Zeng, H. and Cao, J.},
  title     = {{AggPose}: Deep Aggregation Vision Transformer for Infant Pose Estimation},
  booktitle = {Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence (IJCAI)},
  year      = {2022},
  url       = {https://www.ijcai.org/proceedings/2022/700},
}
2023 Preprint
PIE: Simulating Disease Progression via Progressive Image Editing (opens in new tab)
Liang K, Cao X, Liao KD, Gao T, Ye W, Chen Z, Cao J, Nama T, Sun J.
Code
Cite
@misc{liang2023pie,
  author        = {Liang, K. and Cao, X. and Liao, K. D. and Gao, T. and Ye, W. and Chen, Z. and Cao, J. and Nama, T. and Sun, J.},
  title         = {{PIE}: Simulating Disease Progression via Progressive Image Editing},
  year          = {2023},
  eprint        = {2309.11745},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2309.11745},
}