update _pages/zh&en/videos.md

VictorChen2002 · VictorChen2002 · commit 3fbe078a25e9 · 2025-07-02T20:26:28.000+02:00
diff --git a/_pages/en/videos.md b/_pages/en/videos.md
@@ -9,15 +9,75 @@ nav_order: 6
 ---
 
 <div align="center">
-<h3> Xmart Student Forum </h3> 
+<h3> Xmart Student Forum </h3>
 
-<h4> Episode 2 </h4> 
+<h4> Session 14 Yuancheng Wang: Towards Natural and Efficient Speech Synthesis — Perspectives on Modeling, Alignment, and Representation</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1FuKzzGEq3&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
 
-<iframe src="//player.bilibili.com/player.html?bvid=BV1qihreEE6L&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"> </iframe>
+<h4> Session 13 Dongchao Yang: Towards Multi-task Audio Foundation Models — An Audio Generation Perspective</h4>
+<!-- Pending upload -->
 
-<h4> Episode 1 </h4> 
+<h4> Session 12 Junzuo Zhou & Yong Ren: Traceable Protection of Speech — Research on Audio Watermarking</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1EuL7zNEHH&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
 
-<iframe src="//player.bilibili.com/player.html?bvid=BV1FJ4m137ZB&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"> </iframe>
+<h4> Session 11 Shengpeng Ji: Opportunities and Challenges in the Era of End-to-End Spoken Dialogue</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1FaZGYXEdc&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> Session 10 Ruibin Yuan: Scaling Open Foundation Models for Music</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1rU9EYhEx3&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> Session 9 Shaolei Zhang: Toward Real-time Cross-Language Communication — Challenges, Techniques, and Future of Real-time Speech Models</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV15nwLeaEU1&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> Session 8 Junbin Xiao & Leilei Li: Research and Outlook on First-Person Perspective Problems</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1Ftk1Y6Ehs&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> Session 7 Zirui Guo: From Retrieval-Augmented Generation to Graph-Augmented Generation — Exploring Next-Generation Intelligent Q&A Systems</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV137kJYHEoC&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> Session 6 Haohe Liu: Latent Diffusion Model as a Versatile Coarse-to-Fine Audio Decoder</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1JjmBYYEoW&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> Session 5 Tianbao Xie: OSWorld — Benchmarking Multimodal Agents for Open-Ended Tasks in a Real Computer Environment</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1CpyNYBE6o&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> Session 4 Yuchen Hu: Post-Training Alignment of Large Speech Models</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1uzxeevEb8&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> Session 3 Junyi Ao: SD-Eval, a New Benchmark — Equipping Large Speech Interaction Models with Cognitive and Emotional Intelligence</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1hixeeqEkQ&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> Session 2 Keqi Deng: Label-synchronous Neural Transducer</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1qihreEE6L&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> Session 1 Dong Zhang: Building End-to-End Large Spoken Dialogue Models</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1FJ4m137ZB&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
 </div>
 
+<div align="center">
+<h3> Xmart Frontier Talks </h3>
+
+<h4> Session 7 Kele Xu: Multimodal Machine Learning for Sound Understanding</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1zX9EYZELX&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> Session 6 Cewu Lu: Embodied Intelligence Scaling Laws and Scalable Data</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1hc6JYLE11&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> Session 5 Wenwu Wang: Large Language-Audio Models and Their Applications</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1k7knYgEXT&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> Session 4 Xipeng Qiu: From Large Language Models to World Models</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1AJqGYuEZa&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> Session 3 Tianfan Fu: Applications of Deep Learning in Drug Discovery and Development</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV13XBiYdELy&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> Session 2 Hung-yi Lee: Challenges of Teaching New Skills to Foundation Models</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1FsUtY3EQV&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> Session 1 Haofen Wang: Knowledge Retrieval Augmentation — Paradigms and Key Technologies</h4>
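+<!-- NOTE(review): this bvid is identical to the one used for Student Forum Session 1 above; confirm the correct video ID for this talk. --><iframe src="//player.bilibili.com/player.html?bvid=BV1FJ4m137ZB&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>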
+</div>
+
+
 
diff --git a/_pages/zh/videos.md b/_pages/zh/videos.md
@@ -10,13 +10,73 @@ nav_order: 6
 
 
 <div align="center">
-<h3> Xmart学生论坛 </h3> 
+<h3> Xmart 学生论坛 </h3>
 
-<h4> 第二期 </h4> 
+<h4> 第十四期 王远程：Towards Natural and Efficient Speech Synthesis: Perspectives on Modeling, Alignment, and Representation</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1FuKzzGEq3&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
 
-<iframe src="//player.bilibili.com/player.html?bvid=BV1qihreEE6L&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"> </iframe>
+<h4> 第十三期 杨东超：Towards Multi-task Audio Foundation Models: An Audio Generation Perspective</h4>
+<!-- 待上传 -->
 
-<h4> 第一期 </h4> 
+<h4> 第十二期 周俊佐、任勇：语音的可溯源保护：音频水印研究</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1EuL7zNEHH&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
 
-<iframe src="//player.bilibili.com/player.html?bvid=BV1FJ4m137ZB&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"> </iframe>
+<h4> 第十一期 季圣鹏：端到端语音对话时代的机遇和挑战</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1FaZGYXEdc&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> 第十期 袁锐斌：Scaling Open Foundation Models for Music</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1rU9EYhEx3&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> 第九期 张绍磊：迈向实时跨语言沟通：实时语音模型的挑战、技术和未来</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV15nwLeaEU1&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> 第八期 肖俊斌、李磊磊：面向第一视角的问题研究与展望</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1Ftk1Y6Ehs&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> 第七期 郭子睿：从检索增强生成到图增强生成：探索新一代智能问答系统</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV137kJYHEoC&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> 第六期 刘濠赫：Latent Diffusion Model as a Versatile Coarse-to-Fine Audio Decoder</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1JjmBYYEoW&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> 第五期 谢天宝：OSWorld：在真实计算机环境中对开放式任务进行多模态智能体基准测试</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1CpyNYBE6o&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> 第四期 胡宇晨：语音大模型的后训练对齐</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1uzxeevEb8&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> 第三期 敖君逸：SD-Eval 新基准，让语音交互大模型情智兼备</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1hixeeqEkQ&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> 第二期 邓克琦：Label-synchronous Neural Transducer</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1qihreEE6L&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> 第一期 张栋：构造端到端语音对话大模型</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1FJ4m137ZB&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
 </div>
+
+<div align="center">
+<h3> Xmart 前沿讲坛 </h3>
+
+<h4> 第七期 许可乐：面向声音理解的多模态机器学习</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1zX9EYZELX&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> 第六期 卢策吾：具身智能 scaling law 与可规模化数据</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1hc6JYLE11&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> 第五期 王文武：大型语言-音频模型及其应用</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1k7knYgEXT&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> 第四期 邱锡鹏：从大语言模型到世界模型</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1AJqGYuEZa&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> 第三期 符天凡：深度学习在药物发现和开发中的应用</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV13XBiYdELy&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> 第二期 李宏毅：将新技能教给基础模型的挑战</h4>
+<iframe src="//player.bilibili.com/player.html?bvid=BV1FsUtY3EQV&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>
+
+<h4> 第一期 王昊奋：知识检索增强：范式与关键技术</h4>
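+<!-- NOTE(review): this bvid is identical to the one used for the Student Forum 第一期 entry above; confirm the correct video ID for this talk. --><iframe src="//player.bilibili.com/player.html?bvid=BV1FJ4m137ZB&page=1" scrolling="no" border="0" frameborder="no" framespacing="0" allowfullscreen="true" width="100%" height="500"></iframe>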
+</div>
+