% MILR (ICLR 2026): conference paper, so the venue is stored in booktitle.
% The correspondence field is non-standard; standard styles ignore unknown fields.
@inproceedings{2026milr,
  title          = {{MILR}: Improving Multimodal Image Generation via Test-Time Latent Reasoning},
  author         = {Mi, Yapeng and Zhao, Yanpeng and Li, Hengli and Li, Chenxi and Wu, Huimin and Ma, Xiaojian and Zhu, Song-Chun and Wu, Ying Nian and Li, Qing},
  booktitle      = {International Conference on Learning Representations (ICLR)},
  year           = {2026},
  correspondence = {Zhao, Yanpeng and Li, Qing},
}
SceneDreamer360: Text-Driven 3D-Consistent Scene Generation with Panoramic Gaussian Splatting
Wenrui Li, Fucheng Cai, Yapeng Mi, Zhe Yang, Wangmeng Zuo, Xingtao Wang, and Xiaopeng Fan✉
% SceneDreamer360: journal article in IEEE Transactions on Multimedia.
% Braced words in the title keep their capitalisation under sentence-casing styles.
% NOTE(review): the citation key says 2024 while the year field says 2026; the key is
% left unchanged so existing citations keep resolving -- confirm the publication year.
@article{li2024scenedreamer360,
  title          = {{SceneDreamer360}: Text-Driven {3D}-Consistent Scene Generation with Panoramic {Gaussian} Splatting},
  author         = {Li, Wenrui and Cai, Fucheng and Mi, Yapeng and Yang, Zhe and Zuo, Wangmeng and Wang, Xingtao and Fan, Xiaopeng},
  journal        = {IEEE Transactions on Multimedia},
  year           = {2026},
  correspondence = {Fan, Xiaopeng},
}
2025
Iterative Tool Usage Exploration for Multimodal Agents via Step-wise Preference Tuning
% Iterative Tool Usage Exploration (NeurIPS 2025): conference paper, venue stored in booktitle.
% The equalauthor and correspondence fields are non-standard; standard styles ignore unknown fields.
@inproceedings{2025iterative,
  title          = {Iterative Tool Usage Exploration for Multimodal Agents via Step-wise Preference Tuning},
  author         = {Li, Pengxiang and Gao, Zhi and Zhang, Bofei and Mi, Yapeng and Ma, Xiaojian and Shi, Chenrui and Yuan, Tao and Wu, Yuwei and Jia, Yunde and Zhu, Song-Chun and Li, Qing},
  equalauthor    = {Li, Pengxiang and Gao, Zhi},
  booktitle      = {Advances in Neural Information Processing Systems (NeurIPS)},
  year           = {2025},
  correspondence = {Wu, Yuwei and Li, Qing},
}
Building LLM Agents by Incorporating Insights from Computer Systems
% Building LLM Agents: arXiv preprint. The arXiv identifier lives in the eprint fields
% instead of being embedded in a journal name; the url is the abstract page for that identifier.
% NOTE(review): if a downstream renderer reads the journal field to show the venue, confirm it
% also understands eprint/archiveprefix.
@misc{mi2025building,
  title          = {Building {LLM} Agents by Incorporating Insights from Computer Systems},
  author         = {Mi, Yapeng and Gao, Zhi and Ma, Xiaojian and Li, Qing},
  eprint         = {2504.04485},
  archiveprefix  = {arXiv},
  url            = {https://arxiv.org/abs/2504.04485},
  year           = {2025},
  correspondence = {Li, Qing},
}