|
1 | 1 | [ |
2 | 2 | { |
3 | | - "category": [], |
| 3 | + "category": ["DigitalAIAgents"], |
4 | 4 | "title": "AgentTrek: Agent Trajectory Synthesis via Guiding Replay with Web Tutorials", |
5 | 5 | "authors": "Yiheng Xu, Dunjie Lu, Zhennan Shen, Junli Wang, Zekun Wang, Yuchen Mao, Caiming Xiong, Tao Yu", |
6 | 6 | "publication": "Preprint", |
|
12 | 12 | "image": "/research/agenttrek.jpg" |
13 | 13 | }, |
14 | 14 | { |
15 | | - "category": [], |
| 15 | + "category": ["DigitalAIAgents"], |
16 | 16 | "title": "Aguvis: Unified Pure Vision Agents for Autonomous GUI Interaction", |
17 | 17 | "authors": "Yiheng Xu, Zekun Wang, Junli Wang, Dunjie Lu, Tianbao Xie, Amrita Saha, Doyen Sahoo, Tao Yu, Caiming Xiong", |
18 | 18 | "publication": "Preprint", |
|
24 | 24 | "image": "/research/aguvis.jpg" |
25 | 25 | }, |
26 | 26 | { |
27 | | - "category": ["Grounding"], |
| 27 | + "category": ["CodeGeneration"], |
28 | 28 | "title": "BRIGHT: A Realistic and Challenging Benchmark for Reasoning-Intensive Retrieval", |
29 | 29 | "authors": "Hongjin Su, Howard Yen, Mengzhou Xia, Weijia Shi, Niklas Muennighoff, Han-yu Wang, Haisu Liu, Quan Shi, Zachary S. Siegel, Michael Tang, Ruoxi Sun, Jinsung Yoon, Sercan O. Arik, Danqi Chen, Tao Yu", |
30 | 30 | "publication": "Preprint", |
|
36 | 36 | "image": "/research/bright.jpg" |
37 | 37 | }, |
38 | 38 | { |
39 | | - "category": ["Grounding"], |
| 39 | + "category": ["CodeGeneration"], |
40 | 40 | "title": "Spider2-V: How Far Are Multimodal Agents From Automating Data Science and Engineering Workflows?", |
41 | 41 | "authors": "Ruisheng Cao, Fangyu Lei, Haoyuan Wu, Jixuan Chen, Yeqiao Fu, Hongcheng Gao, Xinzhuang Xiong, Hanchong Zhang, Yuchen Mao, Wenjing Hu, Tianbao Xie, Hongshen Xu, Danyang Zhang, Sida Wang, Ruoxi Sun, Pengcheng Yin, Caiming Xiong, Ansong Ni, Qian Liu, Victor Zhong, Lu Chen, Kai Yu, Tao Yu", |
42 | 42 | "publication": "NeurIPS 2024 Spotlight", |
|
48 | 48 | "image": "/research/spider2v.jpg" |
49 | 49 | }, |
50 | 50 | { |
51 | | - "category": [], |
| 51 | + "category": ["DigitalAIAgents"], |
52 | 52 | "title": "Attacking Vision-Language Computer Agents via Pop-ups", |
53 | 53 | "authors": "Yanzhe Zhang, Tao Yu, Diyi Yang", |
54 | 54 | "publication": "Preprint", |
|
60 | 60 | "image": "/research/attack.jpg" |
61 | 61 | }, |
62 | 62 | { |
63 | | - "category": ["Grounding"], |
| 63 | + "category": ["CodeGeneration"], |
64 | 64 | "title": "Spider 2.0: Evaluating Language Models on Real-World Enterprise Text-to-SQL Workflows", |
65 | 65 | "authors": "Fangyu Lei, Jixuan Chen, Yuxiao Ye, Ruisheng Cao, Dongchan Shin, Hongjin Su, Zhaoqing Suo, Hongcheng Gao, Wenjing Hu, Pengcheng Yin, Victor Zhong, Caiming Xiong, Ruoxi Sun, Qian Liu, Sida Wang, Tao Yu", |
66 | 66 | "publication": "Preprint", |
|
72 | 72 | "image": "/research/spider2.jpg" |
73 | 73 | }, |
74 | 74 | { |
75 | | - "category": ["PoweredAgents", "InteractiveSystems", "ToolUse"], |
| 75 | + "category": ["DigitalAIAgents"], |
76 | 76 | "title": "OSWorld: Benchmarking Multimodal Agents for Open-Ended Tasks in Real Computer Environments", |
77 | 77 | "authors": "Tianbao Xie, Danyang Zhang, Jixuan Chen, Xiaochuan Li, Siheng Zhao, Ruisheng Cao, Toh Jing Hua, Zhoujun Cheng, Dongchan Shin, Fangyu Lei, Yitao Liu, Yiheng Xu, Shuyan Zhou, Silvio Savarese, Caiming Xiong, Victor Zhong, Tao Yu", |
78 | 78 | "publication": "NeurIPS 2024", |
|
84 | 84 | "image": "/research/osworld.png" |
85 | 85 | }, |
86 | 86 | { |
87 | | - "category": ["Grounding", "EfficientLLMs"], |
| 87 | + "category": ["CodeGeneration"], |
88 | 88 | "title": "EvoR: Evolving Retrieval for Code Generation", |
89 | 89 | "authors": "Hongjin Su, Shuyang Jiang, Yuhang Lai, Haoyuan Wu, Boao Shi, Che Liu, Qian Liu, Tao Yu", |
90 | 90 | "publication": "Preprint", |
|
96 | 96 | "image": "/research/ark.jpeg" |
97 | 97 | }, |
98 | 98 | { |
99 | | - "category": ["EfficientLLMs"], |
| 99 | + "category": ["CodeGeneration"], |
100 | 100 | "title": "Generative Representational Instruction Tuning", |
101 | 101 | "authors": "Niklas Muennighoff, Hongjin Su, Liang Wang, Nan Yang, Furu Wei, Tao Yu, Amanpreet Singh, Douwe Kiela", |
102 | 102 | "publication": "Preprint", |
|
108 | 108 | "image": "/research/grit.jpeg" |
109 | 109 | }, |
110 | 110 | { |
111 | | - "category": ["PoweredAgents", "InteractiveSystems", "ToolUse"], |
| 111 | + "category": ["DigitalAIAgents"], |
112 | 112 | "title": "OS-Copilot: Towards Generalist Computer Agents with Self-Improvement", |
113 | 113 | "authors": "Zhiyong Wu, Chengcheng Han, Zichen Ding, Zhenmin Weng, Zhoumianze Liu, Shunyu Yao, Tao Yu, Lingpeng Kong", |
114 | 114 | "publication": "Preprint", |
|
120 | 120 | "image": "/research/os-copilot.png" |
121 | 121 | }, |
122 | 122 | { |
123 | | - "category": ["PoweredAgents", "InteractiveSystems"], |
| 123 | + "category": ["DigitalAIAgents"], |
124 | 124 | "title": "OpenAgents: An Open Platform for Language Agents in the Wild", |
125 | 125 | "authors": "Tianbao Xie*, Fan Zhou*, Zhoujun Cheng*, Peng Shi*, Luoxuan Weng*, Yitao Liu*, Toh Jing Hua, Junning Zhao, Qian Liu, Che Liu, Leo Z. Liu, Yiheng Xu, Hongjin Su, Dongchan Shin, Caiming Xiong, Tao Yu", |
126 | 126 | "publication": "Preprint", |
|
132 | 132 | "image": "/research/openagents.png" |
133 | 133 | }, |
134 | 134 | { |
135 | | - "category": ["PoweredAgents", "Grounding", "ToolUse"], |
| 135 | + "category": ["DigitalAIAgents"], |
136 | 136 | "title": "Lemur: Harmonizing Natural Language and Code for Language Agents", |
137 | 137 | "authors": "Yiheng Xu*, Hongjin Su*, Chen Xing*, Boyu Mi, Qian Liu, Weijia Shi, Binyuan Hui, Fan Zhou, Yitao Liu, Tianbao Xie, Zhoujun Cheng, Siheng Zhao, Lingpeng Kong, Bailin Wang, Caiming Xiong, Tao Yu", |
138 | 138 | "publication": "ICLR 2024 Spotlight", |
|
148 | 148 | ] |
149 | 149 | }, |
150 | 150 | { |
151 | | - "category": ["Grounding", "Robotics"], |
| 151 | + "category": ["PhysicalAIAgents"], |
152 | 152 | "title": "Text2Reward: Automated Dense Reward Function Generation for Reinforcement Learning", |
153 | 153 | "authors": "Tianbao Xie*, Siheng Zhao*, Chen Henry Wu, Yitao Liu, Qian Luo, Victor Zhong, Yanchao Yang, Tao Yu", |
154 | 154 | "publication": "ICLR 2024 Spotlight", |
|
160 | 160 | "image": "/research/text2reward.png" |
161 | 161 | }, |
162 | 162 | { |
163 | | - "category": ["EfficientLLMs"], |
| 163 | + "category": ["CodeGeneration"], |
164 | 164 | "title": "Instructor Embeddings: One Embedder, Any Task: Instruction-Finetuned Text Embeddings", |
165 | 165 | "authors": "Hongjin Su*, Weijia Shi*, Jungo Kasai, Yizhong Wang, Yushi Hu, Mari Ostendorf, Wen-tau Yih, Noah A. Smith, Luke Zettlemoyer, Tao Yu", |
166 | 166 | "publication": "ACL 2023 Findings", |
|
177 | 177 | ] |
178 | 178 | }, |
179 | 179 | { |
180 | | - "category": ["Grounding"], |
| 180 | + "category": ["CodeGeneration"], |
181 | 181 | "title": "DS-1000: A Natural and Reliable Benchmark for Data Science Code Generation", |
182 | 182 | "authors": "Yuhang Lai*, Chengxi Li*, Yiming Wang*, Tianyi Zhang*, Ruiqi Zhong*, Luke Zettlemoyer, Scott Wen-tau Yih, Daniel Fried, Sida Wang, Tao Yu", |
183 | 183 | "publication": "ICML 2023", |
|
189 | 189 | "image": "/research/ds-1000.jpg" |
190 | 190 | }, |
191 | 191 | { |
192 | | - "category": ["Grounding"], |
| 192 | + "category": ["CodeGeneration"], |
193 | 193 | "title": "Coder Reviewer Reranking for Code Generation", |
194 | 194 | "authors": "Tianyi Zhang, Tao Yu, Tatsunori B. Hashimoto, Mike Lewis, Wen-tau Yih, Daniel Fried, Sida I. Wang", |
195 | 195 | "publication": "ICML 2023", |
|
201 | 201 | "image": "/research/code-review.jpg" |
202 | 202 | }, |
203 | 203 | { |
204 | | - "category": ["EfficientLLMs"], |
| 204 | + "category": ["CodeGeneration"], |
205 | 205 | "title": "Compositional Exemplars for In-context Learning", |
206 | 206 | "authors": "Jiacheng Ye, Zhiyong Wu, Jiangtao Feng, Tao Yu, Lingpeng Kong", |
207 | 207 | "publication": "ICML 2023", |
|
213 | 213 | "image": "/research/ce-icl.png" |
214 | 214 | }, |
215 | 215 | { |
216 | | - "category": ["Grounding", "ToolUse"], |
| 216 | + "category": ["CodeGeneration"], |
217 | 217 | "title": "Binder: Binding Language Models in Symbolic Languages", |
218 | 218 | "authors": "Zhoujun Cheng*, Tianbao Xie*, Peng Shi, Chengzu Li, Rahul Nadkarni, Yushi Hu, Caiming Xiong, Dragomir Radev, Mari Ostendorf, Luke Zettlemoyer, Noah A Smith, Tao Yu", |
219 | 219 | "publication": "ICLR 2023", |
|
225 | 225 | "image": "/research/binder.jpg" |
226 | 226 | }, |
227 | 227 | { |
228 | | - "category": ["EfficientLLMs"], |
| 228 | + "category": ["CodeGeneration"], |
229 | 229 | "title": "Selective Annotation Makes Language Models Better Few-Shot Learners", |
230 | 230 | "authors": "Hongjin Su, Jungo Kasai, Chen Henry Wu, Weijia Shi, Tianlu Wang, Jiayi Xin, Rui Zhang, Mari Ostendorf, Luke Zettlemoyer, Noah A. Smith, Tao Yu", |
231 | 231 | "publication": "ICLR 2023", |
|
236 | 236 | "image": "/research/selective-annotation.jpg" |
237 | 237 | }, |
238 | 238 | { |
239 | | - "category": ["Grounding", "EfficientLLMs"], |
| 239 | + "category": ["CodeGeneration"], |
240 | 240 | "title": "UnifiedSKG: Unifying and Multi-Tasking Structured Knowledge Grounding with Text-to-Text Language Models", |
241 | 241 | "authors": "Tianbao Xie*, Chen Henry Wu*, Peng Shi, Ruiqi Zhong, Torsten Scholak, Michihiro Yasunaga, Chien-Sheng Wu, Ming Zhong, Pengcheng Yin, Sida I. Wang, Victor Zhong, Bailin Wang, Chengzu Li, Connor Boyle, Ansong Ni, Ziyu Yao, Dragomir Radev, Caiming Xiong, Lingpeng Kong, Rui Zhang, Noah A. Smith, Luke Zettlemoyer, Tao Yu", |
242 | 242 | "publication": "EMNLP 2022", |
|
248 | 248 | "image": "/research/unifiedskg.jpg" |
249 | 249 | }, |
250 | 250 | { |
251 | | - "category": ["EfficientLLMs"], |
| 251 | + "category": ["CodeGeneration"], |
252 | 252 | "title": "ZeroGen: Efficient Zero-shot Learning via Dataset Generation", |
253 | 253 | "authors": "Jiacheng Ye*, Jiahui Gao*, Qintong Li, Hang Xu, Jiangtao Feng, Zhiyong Wu, Tao Yu, Lingpeng Kong", |
254 | 254 | "publication": "EMNLP 2022", |
|
260 | 260 | "image": "/research/zerogen.jpg" |
261 | 261 | }, |
262 | 262 | { |
263 | | - "category": ["EfficientLLMs", "InteractiveSystems"], |
| 263 | + "category": ["CodeGeneration"], |
264 | 264 | "title": "In-Context Learning for Few-Shot Dialogue State Tracking", |
265 | 265 | "authors": "Yushi Hu, Chia-Hsuan Lee, Tianbao Xie, Tao Yu, Noah A. Smith, Mari Ostendorf", |
266 | 266 | "publication": "EMNLP Findings 2022", |
|
272 | 272 | "image": "/research/ic-dst.jpg" |
273 | 273 | }, |
274 | 274 | { |
275 | | - "category": ["Grounding", "InteractiveSystems"], |
| 275 | + "category": ["DigitalAIAgents"], |
276 | 276 | "title": "NL2INTERFACE: Interactive Visualization Interface Generation from Natural Language Queries", |
277 | 277 | "authors": "Yiru Chen, Ryan Li, Austin Mac, Tianbao Xie, Tao Yu, Eugene Wu", |
278 | 278 | "publication": "IEEE Visualization Conference NLVIZ Workshop 2022", |
|
284 | 284 | "image": "/research/nl2interface.jpg" |
285 | 285 | }, |
286 | 286 | { |
287 | | - "category": ["Grounding"], |
| 287 | + "category": ["CodeGeneration"], |
288 | 288 | "title": "GraPPa: Grammar-Augmented Pre-Training for Table Semantic Parsing", |
289 | 289 | "authors": "Tao Yu, Chien-Sheng Wu, Xi Victoria Lin, Bailin Wang, Yi Chern Tan, Xinyi Yang, Dragomir Radev, Richard Socher, Caiming Xiong", |
290 | 290 | "publication": "ICLR 2021", |
|
296 | 296 | "image": "/research/grappa.jpg" |
297 | 297 | }, |
298 | 298 | { |
299 | | - "category": ["Grounding"], |
| 299 | + "category": ["CodeGeneration"], |
300 | 300 | "title": "Semantic Evaluation for Text-to-SQL with Distilled Test Suites", |
301 | 301 | "authors": "Ruiqi Zhong, Tao Yu, Dan Klein", |
302 | 302 | "publication": "EMNLP 2020", |
|
308 | 308 | "image": "/research/test-suite.jpg" |
309 | 309 | }, |
310 | 310 | { |
311 | | - "category": ["Grounding", "InteractiveSystems"], |
| 311 | + "category": ["CodeGeneration"], |
312 | 312 | "title": "CoSQL: A Conversational Text-to-SQL Challenge Towards Cross-Domain Natural Language Interfaces to Databases", |
313 | 313 | "authors": "Tao Yu, Rui Zhang, Heyang Er, Suyi Li, Eric Xue, Bo Pang, Xi Victoria Lin, Yi Chern Tan, Tianze Shi, Zihan Li, Youxuan Jiang, Michihiro Yasunaga, Sungrok Shim, Tao Chen, Alexander Fabbri, Zifan Li, Luyao Chen, Yuwen Zhang, Shreya Dixit, Vincent Zhang, Caiming Xiong, Richard Socher, Walter Lasecki, Dragomir Radev", |
314 | 314 | "publication": "EMNLP 2019", |
|
320 | 320 | "image": "/research/cosql.jpg" |
321 | 321 | }, |
322 | 322 | { |
323 | | - "category": ["Grounding"], |
| 323 | + "category": ["CodeGeneration"], |
324 | 324 | "title": "SParC: Cross-Domain Semantic Parsing in Context", |
325 | 325 | "authors": "Tao Yu, Rui Zhang, Michihiro Yasunaga, Yi Chern Tan, Xi Victoria Lin, Suyi Li, Heyang Er, Irene Li, Bo Pang, Tao Chen, Emily Ji, Shreya Dixit, David Proctor, Sungrok Shim, Jonathan Kraft, Vincent Zhang, Caiming Xiong, Richard Socher, Dragomir Radev", |
326 | 326 | "publication": "ACL 2019", |
|
332 | 332 | "image": "/research/sparc.jpg" |
333 | 333 | }, |
334 | 334 | { |
335 | | - "category": ["Grounding"], |
| 335 | + "category": ["CodeGeneration"], |
336 | 336 | "title": "Spider: A Large-Scale Human-Labeled Dataset for Complex and Cross-Domain Semantic Parsing and Text-to-SQL Task", |
337 | 337 | "authors": "Tao Yu, Rui Zhang, Kai Yang, Michihiro Yasunaga, Dongxu Wang, Zifan Li, James Ma, Irene Li, Qingning Yao, Shanelle Roman, Zilin Zhang, Dragomir Radev", |
338 | 338 | "publication": "EMNLP 2018", |
|
0 commit comments