@@ -72,6 +72,46 @@ <h3>All Publications (from newest to oldest)</h3>
7272 -->
<h4>2025</h4>
<p> <ul class="ul-paper">
<li class="li-paper">
  <span class="title">
    SafeKey: Amplifying Aha-Moment Insights for Safety Reasoning</span>
  <span>Kaiwen Zhou, Yue Fan, Kian Ahrabian, Dan Roth, Xin Eric Wang</span>
  <span>
    <b>EMNLP 2025</b>
  </span>
</li>
<li class="li-paper">
  <span class="title">
    Hidden in Plain Sight: Probing Implicit Reasoning in Multimodal Language Models</span>
  <span>Qianqi Yan, Kaiwen Zhou, Shan Jiang, Yue Fan, Xin Eric Wang</span>
  <span>
    <b>EMNLP 2025</b>
  </span>
</li>
<li class="li-paper">
  <span class="title">
    GUI-Bee: Align GUI Action Grounding to Novel Environments via Autonomous Exploration</span>
  <span>Jiuzhou Han, Yue Fan, Lei Ding, Weixi Feng, Linjie Li, Zhengyuan Yang, Kevin Lin, Jianfeng Wang, Lijuan Wang, Xin Eric Wang</span>
  <span>
    <b>EMNLP 2025</b>
  </span>
</li>
<li class="li-paper">
  <span class="title">
    Agent S2: A Compositional Generalist-Specialist Framework for Computer Use Agents</span>
  <span>Jiuzhou Han*, Saaket Agashe*, Shuyu Gan, Ying Chen, Yue Fan, Xin Eric Wang</span>
  <span>
    <b>COLM 2025</b>
  </span>
</li>
<li class="li-paper">
  <span class="title">
    VLM4D: Towards Spatiotemporal Awareness in Vision Language Models</span>
  <span>Weixi Feng*, Yue Fan*, Jiuzhou Han, Kaizhi Zheng, Kaiwen Zhou, Shan Jiang, Yang Zhao, Yachuan Li, Xin Eric Wang</span>
  <span>
    <b>ICCV 2025</b>
  </span>
</li>
<li class="li-paper">
<span class="title">
Multimodal Inconsistency Reasoning (MMIR): A New Benchmark for Multimodal Reasoning Models</span>
@@ -80,7 +120,6 @@ <h4>2025</h4>
<b>Findings of ACL 2025</b>
</span>
</li>
83-
<li class="li-paper">
<span class="title">
Worse than Random? An Embarrassingly Simple Probing Evaluation of Large Multimodal Models in Medical VQA</span>
@@ -90,7 +129,6 @@ <h4>2025</h4>
<em>NeurIPS 2024 Workshop on GenAI for Health</em>
</span>
</li>
93-
<li class="li-paper">
<span class="title">
Agent S: An Open Agentic Framework that Uses Computers Like a Human</span>
0 commit comments