From 81885945dc991d3960b4bec9e61ec6d75d39e124 Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Thu, 6 Nov 2025 22:35:34 +0100 Subject: [PATCH 01/19] Add explicit id for all Lei Li author mentions Catch-all id for now --- data/xml/2020.acl.xml | 4 ++-- data/xml/2020.emnlp.xml | 6 +++--- data/xml/2020.findings.xml | 4 ++-- data/xml/2020.fnp.xml | 2 +- data/xml/2020.sdp.xml | 2 +- data/xml/2020.wmt.xml | 4 ++-- data/xml/2021.acl.xml | 18 +++++++++--------- data/xml/2021.eacl.xml | 2 +- data/xml/2021.emnlp.xml | 10 +++++----- data/xml/2021.findings.xml | 20 ++++++++++---------- data/xml/2021.iwslt.xml | 2 +- data/xml/2021.naacl.xml | 12 ++++++------ data/xml/2021.wmt.xml | 2 +- data/xml/2022.aacl.xml | 2 +- data/xml/2022.acl.xml | 12 ++++++------ data/xml/2022.coling.xml | 4 ++-- data/xml/2022.emnlp.xml | 4 ++-- data/xml/2022.findings.xml | 24 ++++++++++++------------ data/xml/2022.iwslt.xml | 2 +- data/xml/2022.naacl.xml | 4 ++-- data/xml/2023.acl.xml | 10 +++++----- data/xml/2023.americasnlp.xml | 2 +- data/xml/2023.emnlp.xml | 10 +++++----- data/xml/2023.findings.xml | 16 ++++++++-------- data/xml/2023.ijcnlp.xml | 2 +- data/xml/2024.acl.xml | 12 ++++++------ data/xml/2024.ccl.xml | 2 +- data/xml/2024.emnlp.xml | 12 ++++++------ data/xml/2024.findings.xml | 20 ++++++++++---------- data/xml/2024.iwslt.xml | 4 ++-- data/xml/2024.lrec.xml | 4 ++-- data/xml/2024.naacl.xml | 2 +- data/xml/2025.acl.xml | 10 +++++----- data/xml/2025.coling.xml | 2 +- data/xml/2025.emnlp.xml | 6 +++--- data/xml/2025.findings.xml | 18 +++++++++--------- data/xml/2025.iwslt.xml | 2 +- data/xml/2025.naacl.xml | 10 +++++----- data/xml/D18.xml | 2 +- data/xml/D19.xml | 6 +++--- data/xml/K19.xml | 2 +- data/xml/N18.xml | 2 +- data/xml/P16.xml | 2 +- data/xml/P19.xml | 12 ++++++------ data/xml/W13.xml | 4 ++-- data/xml/W14.xml | 2 +- data/xml/W16.xml | 2 +- data/xml/W17.xml | 4 ++-- data/xml/W19.xml | 4 ++-- data/xml/Y06.xml | 2 +- data/yaml/name_variants.yaml | 3 +++ 51 files changed, 167 insertions(+), 164 deletions(-) diff --git a/data/xml/2020.acl.xml b/data/xml/2020.acl.xml index f7e4e32899..3918997eda 100644 --- a/data/xml/2020.acl.xml +++ b/data/xml/2020.acl.xml @@ -4234,7 +4234,7 @@ NingMiao YuxuanSong HaoZhou - LeiLi + LeiLi 3436–3441 It has been a common approach to pre-train a language model on a large corpus and fine-tune it on task-specific data. In practice, we observe that fine-tuning a pre-trained model on a small dataset may lead to over- and/or under-estimate problem. In this paper, we propose MC-Tailor, a novel method to alleviate the above issue in text generation tasks by truncating and transferring the probability mass from over-estimated regions to under-estimated ones. Experiments on a variety of text generation datasets show that MC-Tailor consistently and significantly outperforms the fine-tuning approach. 2020.acl-main.314 @@ -10481,7 +10481,7 @@ XijinZhang SongchengJiang YuxuanWang - LeiLi + LeiLi 1–8 This paper proposes the building of Xiaomingbot, an intelligent, multilingual and multimodal software robot equipped with four inte- gral capabilities: news generation, news translation, news reading and avatar animation. Its system summarizes Chinese news that it automatically generates from data tables. Next, it translates the summary or the full article into multiple languages, and reads the multi- lingual rendition through synthesized speech. 
Notably, Xiaomingbot utilizes a voice cloning technology to synthesize the speech trained from a real person’s voice data in one input language. The proposed system enjoys several merits: it has an animated avatar, and is able to generate and read multilingual news. Since it was put into practice, Xiaomingbot has written over 600,000 articles, and gained over 150,000 followers on social media platforms. 2020.acl-demos.1 diff --git a/data/xml/2020.emnlp.xml b/data/xml/2020.emnlp.xml index 1bf9ab29c4..74ace32d5f 100644 --- a/data/xml/2020.emnlp.xml +++ b/data/xml/2020.emnlp.xml @@ -1707,7 +1707,7 @@ ShuangZeng RunxinXu BaobaoChang - LeiLi + LeiLi 1630–1640 Document-level relation extraction aims to extract relations among entities within a document. Different from sentence-level relation extraction, it requires reasoning over multiple sentences across paragraphs. In this paper, we propose Graph Aggregation-and-Inference Network (GAIN), a method to recognize such relations for long paragraphs. GAIN constructs two graphs, a heterogeneous mention-level graph (MG) and an entity-level graph (EG). The former captures complex interaction among different mentions and the latter aggregates mentions underlying for the same entities. Based on the graphs we propose a novel path reasoning mechanism to infer relations between entities. Experiments on the public dataset, DocRED, show GAIN achieves a significant performance improvement (2.85 on F1) over the previous state-of-the-art. Our code is available at https://github.com/PKUnlp-icler/GAIN. 2020.emnlp-main.127 @@ -2836,7 +2836,7 @@ XipengQiu JiangtaoFeng HaoZhou - LeiLi + LeiLi 2649–2663 We investigate the following question for machine translation (MT): can we develop a single universal MT model to serve as the common seed and obtain derivative and improved models on arbitrary language pairs? We propose mRASP, an approach to pre-train a universal multilingual neural machine translation model. Our key idea in mRASP is its novel technique of random aligned substitution, which brings words and phrases with similar meanings across multiple languages closer in the representation space. We pre-train a mRASP model on 32 language pairs jointly with only public datasets. The model is then fine-tuned on downstream language pairs to obtain specialized MT models. We carry out extensive experiments on 42 translation directions across a diverse settings, including low, medium, rich resource, and as well as transferring to exotic language pairs. Experimental results demonstrate that mRASP achieves significant performance improvement compared to directly training on those target pairs. It is the first time to verify that multiple lowresource language pairs can be utilized to improve rich resource MT. Surprisingly, mRASP is even able to improve the translation quality on exotic languages that never occur in the pretraining corpus. Code, data, and pre-trained models are available at https://github.com/linzehui/mRASP. 2020.emnlp-main.210 @@ -9842,7 +9842,7 @@ JunxianHe MingxuanWang YimingYang - LeiLi + LeiLi 9119–9130 Pre-trained contextual representations like BERT have achieved great success in natural language processing. However, the sentence embeddings from the pre-trained language models without fine-tuning have been found to poorly capture semantic meaning of sentences. In this paper, we argue that the semantic information in the BERT embeddings is not fully exploited. 
We first reveal the theoretical connection between the masked language model pre-training objective and the semantic similarity task theoretically, and then analyze the BERT sentence embeddings empirically. We find that BERT always induces a non-smooth anisotropic semantic space of sentences, which harms its performance of semantic similarity. To address this issue, we propose to transform the anisotropic sentence embedding distribution to a smooth and isotropic Gaussian distribution through normalizing flows that are learned with an unsupervised objective. Experimental results show that our proposed BERT-flow method obtains significant performance gains over the state-of-the-art sentence embeddings on a variety of semantic textual similarity tasks. The code is available at https://github.com/bohanli/BERT-flow. 2020.emnlp-main.733 diff --git a/data/xml/2020.findings.xml b/data/xml/2020.findings.xml index 2382fc6635..28c4cdd206 100644 --- a/data/xml/2020.findings.xml +++ b/data/xml/2020.findings.xml @@ -1465,7 +1465,7 @@ Language Generation via Combinatorial Constraint Satisfaction: A Tree Search Enhanced <fixed-case>M</fixed-case>onte-<fixed-case>C</fixed-case>arlo Approach MaosenZhang NanJiang - LeiLi + LeiLi YexiangXue 1286–1298 Generating natural language under complex constraints is a principled formulation towards controllable text generation. We present a framework to allow specification of combinatorial constraints for sentence generation. We propose TSMC, an efficient method to generate high likelihood sentences with respect to a pre-trained language model while satisfying the constraints. Our approach is highly flexible, requires no task-specific train- ing, and leverages efficient constraint satisfaction solving techniques. To better handle the combinatorial constraints, a tree search algorithm is embedded into the proposal process of the Markov Chain Monte Carlo (MCMC) to explore candidates that satisfy more constraints. Compared to existing MCMC approaches, our sampling approach has a better mixing performance. Experiments show that TSMC achieves consistent and significant improvement on multiple language generation tasks. @@ -5726,7 +5726,7 @@ MingxuanWang WeinanZhang YongYu - LeiLi + LeiLi 4908–4917 Active learning for sentence understanding aims at discovering informative unlabeled data for annotation and therefore reducing the demand for labeled data. We argue that the typical uncertainty sampling method for active learning is time-consuming and can hardly work in real-time, which may lead to ineffective sample selection. We propose adversarial uncertainty sampling in discrete space (AUSDS) to retrieve informative unlabeled samples more efficiently. AUSDS maps sentences into latent space generated by the popular pre-trained language models, and discover informative unlabeled text samples for annotation via adversarial attack. The proposed approach is extremely efficient compared with traditional uncertainty sampling with more than 10x speedup. Experimental results on five datasets show that AUSDS outperforms strong baselines on effectiveness. 
2020.findings-emnlp.441 diff --git a/data/xml/2020.fnp.xml b/data/xml/2020.fnp.xml index 3752fcbd16..30cff5edd3 100644 --- a/data/xml/2020.fnp.xml +++ b/data/xml/2020.fnp.xml @@ -194,7 +194,7 @@ Extractive Financial Narrative Summarisation based on <fixed-case>DPP</fixed-case>s - LeiLi + LeiLi YafeiJiang YinanLiu 100–104 diff --git a/data/xml/2020.sdp.xml b/data/xml/2020.sdp.xml index db6adb6692..5d198dd20d 100644 --- a/data/xml/2020.sdp.xml +++ b/data/xml/2020.sdp.xml @@ -349,7 +349,7 @@ <fixed-case>CIST</fixed-case>@<fixed-case>CL</fixed-case>-<fixed-case>S</fixed-case>ci<fixed-case>S</fixed-case>umm 2020, <fixed-case>L</fixed-case>ong<fixed-case>S</fixed-case>umm 2020: Automatic Scientific Document Summarization - LeiLi + LeiLi YangXie WeiLiu YinanLiu diff --git a/data/xml/2020.wmt.xml b/data/xml/2020.wmt.xml index 9613f9566f..56f716fc66 100644 --- a/data/xml/2020.wmt.xml +++ b/data/xml/2020.wmt.xml @@ -471,7 +471,7 @@ ZehuiLin YaomingZhu MingxuanWang - LeiLi + LeiLi 305–312 This paper describes our submission systems for VolcTrans for WMT20 shared news translation task. We participated in 8 translation directions. Our basic systems are based on Transformer (CITATION), into which we also employed new architectures (bigger or deeper Transformers, dynamic convolution). The final systems include text pre-process, subword(a.k.a. BPE(CITATION)), baseline model training, iterative back-translation, model ensemble, knowledge distillation and multilingual pre-training. 2020.wmt-1.33 @@ -1443,7 +1443,7 @@ ZhuoZhi JunCao MingxuanWang - LeiLi + LeiLi 985–990 In this paper, we describe our submissions to the WMT20 shared task on parallel corpus filtering and alignment for low-resource conditions. The task requires the participants to align potential parallel sentence pairs out of the given document pairs, and score them so that low-quality pairs can be filtered. Our system, Volctrans, is made of two modules, i.e., a mining module and a scoring module. Based on the word alignment model, the mining mod- ule adopts an iterative mining strategy to extract latent parallel sentences. In the scoring module, an XLM-based scorer provides scores, followed by reranking mechanisms and ensemble. Our submissions outperform the baseline by 3.x/2.x and 2.x/2.x for km-en and ps-en on From Scratch/Fine-Tune conditions. 2020.wmt-1.112 diff --git a/data/xml/2021.acl.xml b/data/xml/2021.acl.xml index f6dfd817ee..c2467d6434 100644 --- a/data/xml/2021.acl.xml +++ b/data/xml/2021.acl.xml @@ -284,7 +284,7 @@ ChangzhiSun YuanbinWu HaoZhou - LeiLi + LeiLi JunchiYan 220–231 Many joint entity relation extraction models setup two separated label spaces for the two sub-tasks (i.e., entity detection and relation classification). We argue that this setting may hinder the information interaction between entities and relations. In this work, we propose to eliminate the different treatment on the two sub-tasks’ label spaces. The input of our model is a table containing all word pairs from a sentence. Entities and relations are represented by squares and rectangles in the table. We apply a unified classifier to predict each cell’s label, which unifies the learning of two sub-tasks. For testing, an effective (yet fast) approximate decoder is proposed for finding squares and rectangles from tables. Experiments on three benchmarks (ACE04, ACE05, SciERC) show that, using only half the number of parameters, our model achieves competitive accuracy with the best extractor, and is faster. 
@@ -315,7 +315,7 @@ XiaoPan MingxuanWang LiweiWu - LeiLi + LeiLi 244–258 Existing multilingual machine translation approaches mainly focus on English-centric directions, while the non-English directions still lag behind. In this work, we aim to build a many-to-many translation system with an emphasis on the quality of non-English language directions. Our intuition is based on the hypothesis that a universal cross-language representation leads to better multilingual translation performance. To this end, we propose mRASP2, a training method to obtain a single unified multilingual translation model. mRASP2 is empowered by two techniques: a) a contrastive learning scheme to close the gap among representations of different languages, and b) data augmentation on both multiple parallel and monolingual data to further align token representations. For English-centric directions, mRASP2 achieves competitive or even better performance than a strong pre-trained model mBART on tens of WMT benchmarks. For non-English directions, mRASP2 achieves an improvement of average 10+ BLEU compared with the multilingual baseline 2021.acl-long.21 @@ -364,7 +364,7 @@ ZehuiLin LiweiWu MingxuanWang - LeiLi + LeiLi 293–305 Multilingual neural machine translation aims at learning a single translation model for multiple languages. These jointly trained models often suffer from performance degradationon rich-resource language pairs. We attribute this degeneration to parameter interference. In this paper, we propose LaSS to jointly train a single unified multilingual MT model. LaSS learns Language Specific Sub-network (LaSS) for each language pair to counter parameter interference. Comprehensive experiments on IWSLT and WMT datasets with various Transformer architectures show that LaSS obtains gains on 36 language pairs by up to 1.2 BLEU. Besides, LaSS shows its strong generalization performance at easy adaptation to new language pairs and zero-shot translation. LaSS boosts zero-shot translation with an average of 8.3 BLEU on 30 language pairs. Codes and trained models are available at https://github.com/NLP-Playground/LaSS. 2021.acl-long.25 @@ -2163,7 +2163,7 @@ LinQiu WeinanZhang YongYu - LeiLi + LeiLi 1993–2003 Recent work on non-autoregressive neural machine translation (NAT) aims at improving the efficiency by parallel decoding without sacrificing the quality. However, existing NAT methods are either inferior to Transformer or require multiple decoding passes, leading to reduced speedup. We propose the Glancing Language Model (GLM) for single-pass parallel generation models. With GLM, we develop Glancing Transformer (GLAT) for machine translation. With only single-pass parallel decoding, GLAT is able to generate high-quality translation with 8×-15× speedup. Note that GLAT does not modify the network architecture, which is a training method to learn word interdependency. Experiments on multiple WMT language directions show that GLAT outperforms all previous single pass non-autoregressive methods, and is nearly comparable to Transformer, reducing the gap to 0.25-0.9 BLEU points. 2021.acl-long.155 @@ -3869,7 +3869,7 @@ The source code has been made available at \url{https://github.com/liam0949/DCLO Document-level Event Extraction via Heterogeneous Graph-based Interaction Model with a Tracker RunxinXu TianyuLiu - LeiLi + LeiLi BaobaoChang 3533–3546 Document-level event extraction aims to recognize event information from a whole piece of article. 
Existing methods are not effective due to two challenges of this task: a) the target event arguments are scattered across sentences; b) the correlation among events in a document is non-trivial to model. In this paper, we propose Heterogeneous Graph-based Interaction Model with a Tracker (GIT) to solve the aforementioned two challenges. For the first challenge, GIT constructs a heterogeneous graph interaction network to capture global interactions among different sentences and entity mentions. For the second, GIT introduces a Tracker module to track the extracted events and hence capture the interdependency among the events. Experiments on a large-scale dataset (Zheng et al, 2019) show GIT outperforms the previous methods by 2.8 F1. Further analysis reveals is effective in extracting multiple correlated events and event arguments that scatter across the document. @@ -5370,7 +5370,7 @@ The source code has been made available at \url{https://github.com/liam0949/DCLO Personalized Transformer for Explainable Recommendation - LeiLi + LeiLi YongfengZhang LiChen 4947–4957 @@ -7997,7 +7997,7 @@ The source code has been made available at \url{https://github.com/liam0949/DCLO HaoZhou ChunGan ZaixiangZheng - LeiLi + LeiLi 7361–7373 The choice of token vocabulary affects the performance of machine translation. This paper aims to figure out what is a good vocabulary and whether we can find the optimal vocabulary without trial training. To answer these questions, we first provide an alternative understanding of vocabulary from the perspective of information theory. It motivates us to formulate the quest of vocabularization – finding the best token dictionary with a proper size – as an optimal transport (OT) problem. We propose VOLT, a simple and efficient solution without trial training. Empirical results show that VOLT beats widely-used vocabularies in diverse scenarios, including WMT-14 English-German translation, TED bilingual translation, and TED multilingual translation. For example, VOLT achieves 70% vocabulary size reduction and 0.5 BLEU gain on English-German translation. Also, compared to BPE-search, VOLT reduces the search time from 384 GPU hours to 30 GPU hours on English-German translation. Codes are available at https://github.com/Jingjing-NLP/VOLT. 2021.acl-long.571 @@ -10453,7 +10453,7 @@ The source code has been made available at \url{https://github.com/liam0949/DCLO MingxuanWang QianqianDong RongYe - LeiLi + LeiLi 55–62 NeurST is an open-source toolkit for neural speech translation. The toolkit mainly focuses on end-to-end speech translation, which is easy to use, modify, and extend to advanced speech translation research and products. NeurST aims at facilitating the speech translation research for NLP researchers and building reliable benchmarks for this field. It provides step-by-step recipes for feature extraction, data preprocessing, distributed training, and evaluation. In this paper, we will introduce the framework design of NeurST and show experimental results for different benchmark datasets, which can be regarded as reliable baselines for future research. The toolkit is publicly available at https://github.com/bytedance/neurst and we will continuously update the performance of with other counterparts and studies at https://st-benchmark.github.io/. 
2021.acl-demo.7 @@ -11081,7 +11081,7 @@ The source code has been made available at \url{https://github.com/liam0949/DCLO Pre-training Methods for Neural Machine Translation MingxuanWang - LeiLi + LeiLi 21–25 This tutorial provides a comprehensive guide to make the most of pre-training for neural machine translation. Firstly, we will briefly introduce the background of NMT, pre-training methodology, and point out the main challenges when applying pre-training for NMT. Then we will focus on analysing the role of pre-training in enhancing the performance of NMT, how to design a better pre-training model for executing specific NMT tasks and how to better integrate the pre-trained model into NMT system. In each part, we will provide examples, discuss training techniques and analyse what is transferred when applying pre-training. 2021.acl-tutorials.4 diff --git a/data/xml/2021.eacl.xml b/data/xml/2021.eacl.xml index c48bdfa284..5cc30f41bc 100644 --- a/data/xml/2021.eacl.xml +++ b/data/xml/2021.eacl.xml @@ -3008,7 +3008,7 @@ ChangzhiSun YuanbinWu HaoZhou - LeiLi + LeiLi JunchiYan 2877–2887 Current state-of-the-art systems for joint entity relation extraction (Luan et al., 2019; Wad-den et al., 2019) usually adopt the multi-task learning framework. However, annotations for these additional tasks such as coreference resolution and event extraction are always equally hard (or even harder) to obtain. In this work, we propose a pre-training method ENPAR to improve the joint extraction performance. ENPAR requires only the additional entity annotations that are much easier to collect. Unlike most existing works that only consider incorporating entity information into the sentence encoder, we further utilize the entity pair information. Specifically, we devise four novel objectives,i.e., masked entity typing, masked entity prediction, adversarial context discrimination, and permutation prediction, to pre-train an entity encoder and an entity pair encoder. Comprehensive experiments show that the proposed pre-training method achieves significant improvement over BERT on ACE05, SciERC, and NYT, and outperforms current state-of-the-art on ACE05. diff --git a/data/xml/2021.emnlp.xml b/data/xml/2021.emnlp.xml index e7faac1620..c2f1fe5fb3 100644 --- a/data/xml/2021.emnlp.xml +++ b/data/xml/2021.emnlp.xml @@ -432,7 +432,7 @@ Dynamic Knowledge Distillation for Pre-trained Language Models - LeiLi + LeiLi YankaiLin ShuhuaiRen PengLi @@ -1301,7 +1301,7 @@ HaoZhou WeinanZhang YongYu - LeiLi + LeiLi 1239–1250 Document-level relation extraction aims to identify relations between entities in a whole document. Prior efforts to capture long-range dependencies have relied heavily on implicitly powerful representations learned through (graph) neural networks, which makes the model less transparent. To tackle this challenge, in this paper, we propose LogiRE, a novel probabilistic model for document-level relation extraction by learning logic rules. LogiRE treats logic rules as latent variables and consists of two modules: a rule generator and a relation extractor. The rule generator is to generate logic rules potentially contributing to final predictions, and the relation extractor outputs final predictions based on the generated logic rules. Those two modules can be efficiently optimized with the expectation-maximization (EM) algorithm. By introducing logic rules into neural networks, LogiRE can explicitly capture long-range dependencies as well as enjoy better interpretation. 
Empirical results show that significantly outperforms several strong baselines in terms of relation performance and logical consistency. Our code is available at https://github.com/rudongyu/LogiRE. 2021.emnlp-main.95 @@ -4705,7 +4705,7 @@ ZhiyuanZeng JiazeChen WeiranXu - LeiLi + LeiLi 4102–4108 Neural abstractive summarization systems have gained significant progress in recent years. However, abstractive summarization often produce inconsisitent statements or false facts. How to automatically generate highly abstract yet factually correct summaries? In this paper, we proposed an efficient weak-supervised adversarial data augmentation approach to form the factual consistency dataset. Based on the artificial dataset, we train an evaluation model that can not only make accurate and robust factual consistency discrimination but is also capable of making interpretable factual errors tracing by backpropagated gradient distribution on token embeddings. Experiments and analysis conduct on public annotated summarization and factual consistency datasets demonstrate our approach effective and reasonable. 2021.emnlp-main.337 @@ -7934,7 +7934,7 @@ JunCao ShanboCheng ShujianHuang - LeiLi + LeiLi 7280–7290 How to effectively adapt neural machine translation (NMT) models according to emerging cases without retraining? Despite the great success of neural machine translation, updating the deployed models online remains a challenge. Existing non-parametric approaches that retrieve similar examples from a database to guide the translation process are promising but are prone to overfit the retrieved examples. However, non-parametric methods are prone to overfit the retrieved examples. In this work, we propose to learn Kernel-Smoothed Translation with Example Retrieval (KSTER), an effective approach to adapt neural machine translation models online. Experiments on domain adaptation and multi-domain machine translation datasets show that even without expensive retraining, KSTER is able to achieve improvement of 1.1 to 1.5 BLEU scores over the best existing online adaptation methods. The code and trained models are released at https://github.com/jiangqn/KSTER. 
2021.emnlp-main.579 @@ -9717,7 +9717,7 @@ Text <fixed-case>A</fixed-case>uto<fixed-case>A</fixed-case>ugment: Learning Compositional Augmentation Policy for Text Classification ShuhuaiRen JinchaoZhang - LeiLi + LeiLi XuSun JieZhou 9029–9043 diff --git a/data/xml/2021.findings.xml b/data/xml/2021.findings.xml index 5b0b476fb0..29c781856a 100644 --- a/data/xml/2021.findings.xml +++ b/data/xml/2021.findings.xml @@ -925,7 +925,7 @@ <fixed-case>U</fixed-case>ni<fixed-case>K</fixed-case>eyphrase: A Unified Extraction and Generation Framework for Keyphrase Prediction HuanqinWu WeiLiu - LeiLi + LeiLi DanNie TaoChen FengZhang @@ -2444,7 +2444,7 @@ ChiHan MingxuanWang HengJi - LeiLi + LeiLi 2214–2225 2021.findings-acl.195 10.18653/v1/2021.findings-acl.195 @@ -3026,7 +3026,7 @@ JiazeChen HaoZhou XipengQiu - LeiLi + LeiLi 2739–2750 2021.findings-acl.242 10.18653/v1/2021.findings-acl.242 @@ -3300,7 +3300,7 @@ LiweiWu ShanboCheng MingxuanWang - LeiLi + LeiLi 3001–3007 2021.findings-acl.264 10.18653/v1/2021.findings-acl.264 @@ -3464,7 +3464,7 @@ YuanbinWu JiazeChen HaoZhou - LeiLi + LeiLi 3140–3151 2021.findings-acl.277 10.18653/v1/2021.findings-acl.277 @@ -6240,7 +6240,7 @@ <fixed-case>C</fixed-case>ascade<fixed-case>BERT</fixed-case>: Accelerating Inference of Pre-trained Language Models via Calibrated Complete Models Cascade - LeiLi + LeiLi YankaiLin DeliChen ShuhuaiRen @@ -6725,7 +6725,7 @@ Leveraging Word-Formation Knowledge for <fixed-case>C</fixed-case>hinese Word Sense Disambiguation HuaZheng - LeiLi + LeiLi DamaiDai DeliChen TianyuLiu @@ -8770,7 +8770,7 @@ Multilingual Translation via Grafting Pre-trained Language Models ZeweiSun MingxuanWang - LeiLi + LeiLi 2735–2747 Can pre-trained BERT for one language and GPT for another be glued together to translate texts? Self-supervised training using only monolingual data has led to the success of pre-trained (masked) language models in many NLP tasks. However, directly connecting BERT as an encoder and GPT as a decoder can be challenging in machine translation, for GPT-like models lack a cross-attention component that is needed in seq2seq decoders. In this paper, we propose Graformer to graft separately pre-trained (masked) language models for machine translation. With monolingual data for pre-training and parallel data for grafting training, we maximally take advantage of the usage of both types of data. Experiments on 60 directions show that our method achieves average improvements of 5.8 BLEU in x2en and 2.9 BLEU in en2x directions comparing with the multilingual Transformer of the same size. 2021.findings-emnlp.233 @@ -8864,7 +8864,7 @@ JiangtaoFeng ChengqiZhao MingxuanWang - LeiLi + LeiLi 2812–2823 Developing a unified multilingual model has been a long pursuing goal for machine translation. However, existing approaches suffer from performance degradation - a single multilingual model is inferior to separately trained bilingual ones on rich-resource languages. We conjecture that such a phenomenon is due to interference brought by joint training with multiple languages. To accommodate the issue, we propose CIAT, an adapted Transformer model with a small parameter overhead for multilingual machine translation. We evaluate CIAT on multiple benchmark datasets, including IWSLT, OPUS-100, and WMT. Experiments show that the CIAT consistently outperforms strong multilingual baselines on 64 of total 66 language directions, 42 of which have above 0.5 BLEU improvement. 
2021.findings-emnlp.240 @@ -10963,7 +10963,7 @@ TaoWang ChengqiZhao MingxuanWang - LeiLi + LeiLi HangLi DeyiXiong 4639–4644 diff --git a/data/xml/2021.iwslt.xml b/data/xml/2021.iwslt.xml index e4e7f0c7c5..6582fc3c5b 100644 --- a/data/xml/2021.iwslt.xml +++ b/data/xml/2021.iwslt.xml @@ -110,7 +110,7 @@ RongYe QianqianDong JunCao - LeiLi + LeiLi 64–74 This paper describes the systems submitted to IWSLT 2021 by the Volctrans team. We participate in the offline speech translation and text-to-text simultaneous translation tracks. For offline speech translation, our best end-to-end model achieves 7.9 BLEU improvements over the benchmark on the MuST-C test set and is even approaching the results of a strong cascade solution. For text-to-text simultaneous translation, we explore the best practice to optimize the wait-k model. As a result, our final submitted systems exceed the benchmark at around 7 BLEU on the same latency regime. We release our code and model to facilitate both future research works and industrial applications. 2021.iwslt-1.6 diff --git a/data/xml/2021.naacl.xml b/data/xml/2021.naacl.xml index e10381b920..d36faa17ca 100644 --- a/data/xml/2021.naacl.xml +++ b/data/xml/2021.naacl.xml @@ -2243,7 +2243,7 @@ Be Careful about Poisoned Word Embeddings: Exploring the Vulnerability of the Embedding Layers in <fixed-case>NLP</fixed-case> Models WenkaiYang - LeiLi + LeiLi ZhiyuanZhang XuanchengRen XuSun @@ -5884,7 +5884,7 @@ Decompose, Fuse and Generate: A Formation-Informed Method for <fixed-case>C</fixed-case>hinese Definition Generation HuaZheng DamaiDai - LeiLi + LeiLi TianyuLiu ZhifangSui BaobaoChang @@ -6173,7 +6173,7 @@ Generative Imagination Elevates Machine Translation QuanyuLong MingxuanWang - LeiLi + LeiLi 5738–5748 There are common semantics shared across text and images. Given a sentence in a source language, whether depicting the visual scene helps translation into a target language? Existing multimodal neural machine translation methods (MNMT) require triplets of bilingual sentence - image for training and tuples of source sentence - image for inference. In this paper, we propose ImagiT, a novel machine translation method via visual imagination. ImagiT first learns to generate visual representation from the source sentence, and then utilizes both source sentence and the “imagined representation” to produce a target translation. Unlike previous methods, it only needs the source sentence at the inference time. Experiments demonstrate that ImagiT benefits from visual imagination and significantly outperforms the text-only neural machine translation baselines. Further analysis reveals that the imagination process in ImagiT helps fill in missing information when performing the degradation strategy. 2021.naacl-main.457 @@ -7335,7 +7335,7 @@ MingxuanWang HongxiaoBai HaiZhao - LeiLi + LeiLi 89–96 We propose to improve unsupervised neural machine translation with cross-lingual supervision (), which utilizes supervision signals from high resource language pairs to improve the translation of zero-source languages. Specifically, for training En-Ro system without parallel corpus, we can leverage the corpus from En-Fr and En-De to collectively train the translation from one language into many languages under one model. % is based on multilingual models which require no changes to the standard unsupervised NMT. 
Simple and effective, significantly improves the translation quality with a big margin in the benchmark unsupervised translation tasks, and even achieves comparable performance to supervised NMT. In particular, on WMT’14 -tasks achieves 37.6 and 35.18 BLEU score, which is very close to the large scale supervised setting and on WMT’16 -tasks achieves 35.09 BLEU score which is even better than the supervised Transformer baseline. 2021.naacl-industry.12 @@ -7361,7 +7361,7 @@ TaoWang ChengqiZhao MingxuanWang - LeiLi + LeiLi DeyiXiong 105–112 Automatic translation of dialogue texts is a much needed demand in many real life scenarios. However, the currently existing neural machine translation delivers unsatisfying results. In this paper, we conduct a deep analysis of a dialogue corpus and summarize three major issues on dialogue translation, including pronoun dropping (), punctuation dropping (), and typos (). In response to these challenges, we propose a joint learning method to identify omission and typo, and utilize context to translate dialogue utterances. To properly evaluate the performance, we propose a manually annotated dataset with 1,931 Chinese-English parallel utterances from 300 dialogues as a benchmark testbed for dialogue translation. Our experiments show that the proposed method improves translation quality by 3.2 BLEU over the baselines. It also elevates the recovery rate of omitted pronouns from 26.09% to 47.16%. We will publish the code and dataset publicly at https://xxx.xx. @@ -7376,7 +7376,7 @@ YingXiong YangWei MingxuanWang - LeiLi + LeiLi 113–120 Transformer and its variants have achieved great success in natural language processing. Since Transformer models are huge in size, serving these models is a challenge for real industrial applications. In this paper, we propose , a highly efficient inference library for models in the Transformer family. includes a series of GPU optimization techniques to both streamline the computation of Transformer layers and reduce memory footprint. supports models trained using PyTorch and Tensorflow. Experimental results on standard machine translation benchmarks show that achieves up to 14x speedup compared with TensorFlow and 1.4x speedup compared with , a concurrent CUDA implementation. The code will be released publicly after the review. 2021.naacl-industry.15 diff --git a/data/xml/2021.wmt.xml b/data/xml/2021.wmt.xml index 2df80ca98f..c9bed4b19a 100644 --- a/data/xml/2021.wmt.xml +++ b/data/xml/2021.wmt.xml @@ -259,7 +259,7 @@ ZehuiLin JiangtaoFeng ShanboCheng - LeiLi + LeiLi MingxuanWang HaoZhou 187–196 diff --git a/data/xml/2022.aacl.xml b/data/xml/2022.aacl.xml index 68f2393158..19f589335b 100644 --- a/data/xml/2022.aacl.xml +++ b/data/xml/2022.aacl.xml @@ -553,7 +553,7 @@ <fixed-case>SAPG</fixed-case>raph: Structure-aware Extractive Summarization for Scientific Papers with Heterogeneous Graph SiyaQi - LeiLi + LeiLi YiyangLi JinJiang DingxinHu diff --git a/data/xml/2022.acl.xml b/data/xml/2022.acl.xml index fd1624a921..4fab3c8f51 100644 --- a/data/xml/2022.acl.xml +++ b/data/xml/2022.acl.xml @@ -278,7 +278,7 @@ ShijieGeng ZuohuiFu YingqiangGe - LeiLi + LeiLi Gerardde Melo YongfengZhang 244-255 @@ -707,7 +707,7 @@ QianDong YaomingZhu MingxuanWang - LeiLi + LeiLi 680-694 How to find proper moments to generate partial sentence translation given a streaming speech input? 
Existing approaches waiting-and-translating for a fixed duration often break the acoustic units in speech, since the boundaries between acoustic units in speech are not even. In this paper, we propose MoSST, a simple yet effective method for translating streaming speech content. Given a usually long speech sequence, we develop an efficient monotonic segmentation module inside an encoder-decoder model to accumulate acoustic information incrementally and detect proper speech unit boundaries for the input in speech translation task. Experiments on multiple translation directions of the MuST-C dataset show that outperforms existing methods and achieves the best trade-off between translation quality (BLEU) and latency. Our code is available at https://github.com/dqqcasia/mosst. 2022.acl-long.50 @@ -2657,7 +2657,7 @@ WangchunshuZhou JingjingXu HaoZhou - LeiLi + LeiLi 2701-2714 Currently, masked language modeling (e.g., BERT) is the prime choice to learn contextualized representations. Due to the pervasiveness, it naturally raises an interesting question: how do masked language models (MLMs) learn contextual representations? In this work, we analyze the learning dynamics of MLMs and find that it adopts sampled embeddings as anchors to estimate and inject contextual semantics to representations, which limits the efficiency and effectiveness of MLMs. To address these problems, we propose TACO, a simple yet effective representation learning approach to directly model global semantics. To be specific, TACO extracts and aligns contextual semantics hidden in contextualized representations to encourage models to attend global semantics when generating contextualized representations. Experiments on the GLUE benchmark show that TACO achieves up to 5x speedup and up to 1.2 points average improvement over MLM. 2022.acl-long.193 @@ -6668,7 +6668,7 @@ in the Case of Unambiguous Gender <fixed-case>STEMM</fixed-case>: Self-learning with Speech-text Manifold Mixup for Speech Translation QingkaiFang RongYe - LeiLi + LeiLi YangFeng MingxuanWang 7050-7062 @@ -7423,7 +7423,7 @@ in the Case of Unambiguous Gender MoshaChen ZhenBi XiaozhuanLiang - LeiLi + LeiLi XinShang KangpingYin ChuanqiTan @@ -7867,7 +7867,7 @@ in the Case of Unambiguous Gender LihuaQian XinyuDai JiajunChen - LeiLi + LeiLi 8398-8409 Recently, parallel text generation has received widespread attention due to its success in generation efficiency. Although many advanced techniques are proposed to improve its generation quality, they still need the help of an autoregressive model for training to overcome the one-to-many multi-modal phenomenon in the dataset, limiting their applications. In this paper, we propose GLAT, which employs the discrete latent variables to capture word categorical information and invoke an advanced curriculum learning technique, alleviating the multi-modality problem. Experiment results show that our method outperforms strong baselines without the help of an autoregressive model, which further broadens the application scenarios of the parallel decoding paradigm. 
2022.acl-long.575 diff --git a/data/xml/2022.coling.xml b/data/xml/2022.coling.xml index 2dbc4374c6..bfdedc0130 100644 --- a/data/xml/2022.coling.xml +++ b/data/xml/2022.coling.xml @@ -2431,7 +2431,7 @@ <fixed-case>L</fixed-case>ight<fixed-case>NER</fixed-case>: A Lightweight Tuning Paradigm for Low-resource <fixed-case>NER</fixed-case> via Pluggable Prompting XiangChen - LeiLi + LeiLi ShuminDeng ChuanqiTan ChangliangXu @@ -2759,7 +2759,7 @@ Augmenting Legal Judgment Prediction with Contrastive Case Relations DugangLiu WeihaoDu - LeiLi + LeiLi WeikePan ZhongMing 2658–2667 diff --git a/data/xml/2022.emnlp.xml b/data/xml/2022.emnlp.xml index 1a6a3b5d0d..7517e92f00 100644 --- a/data/xml/2022.emnlp.xml +++ b/data/xml/2022.emnlp.xml @@ -11465,7 +11465,7 @@ MinghuiQiuAlibaba Group TaolinZhangEast China Normal University TingtingLiuEast China Normal University - LeiLiEast China Normal University + LeiLiEast China Normal University JianingWangEast China Normal University MingWangAlibaba Group JunHuangAlibaba Group @@ -11575,7 +11575,7 @@ XinXieZhejiang University XiangChenZhejiang University ZhouboLiZhejiang University - LeiLiZhejiang University + LeiLiZhejiang University 98-108 We present an open-source and extensible knowledge extraction toolkit DeepKE, supporting complicated low-resource, document-level and multimodal scenarios in the knowledge base population. DeepKE implements various information extraction tasks, including named entity recognition, relation extraction and attribute extraction. With a unified framework, DeepKE allows developers and researchers to customize datasets and models to extract information from unstructured data according to their requirements. Specifically, DeepKE not only provides various functional modules and model implementation for different tasks and scenarios but also organizes all components by consistent frameworks to maintain sufficient modularity and extensibility. We release the source code at GitHub in https://github.com/zjunlp/DeepKE with Google Colab tutorials and comprehensive documents for beginners. Besides, we present an online system in http://deepke.openkg.cn/EN/re_doc_show.html for real-time extraction of various tasks, and a demo video. 2022.emnlp-demos.10 diff --git a/data/xml/2022.findings.xml b/data/xml/2022.findings.xml index 9565c09e27..8678f386d4 100644 --- a/data/xml/2022.findings.xml +++ b/data/xml/2022.findings.xml @@ -880,7 +880,7 @@ XuandongZhao ZhiguoYu MingWu - LeiLi + LeiLi 774-781 How to learn highly compact yet effective sentence representation? Pre-trained language models have been effective in many NLP tasks. However, these models are often huge and produce large sentence embeddings. Moreover, there is a big performance gap between large and small models. In this paper, we propose Homomorphic Projective Distillation (HPD) to learn compressed sentence embeddings. Our method augments a small Transformer encoder model with learnable projection layers to produce compact representations while mimicking a large pre-trained language model to retain the sentence representation quality. We evaluate our method with different model sizes on both semantic textual similarity (STS) and semantic retrieval (SR) tasks. Experiments show that our method achieves 2.7-4.5 points performance gain on STS tasks compared with previous best representations of the same size. In SR tasks, our method improves retrieval speed (8.2×) and memory usage (8.0×) compared with state-of-the-art large models. 
Our implementation is available at https://github.com/XuandongZhao/HPD. 2022.findings-acl.64 @@ -3803,7 +3803,7 @@ ChengqiZhao ShujianHuang JiajunChen - LeiLi + LeiLi 3537-3548 This paper does not aim at introducing a novel model for document-level neural machine translation. Instead, we head back to the original Transformer model and hope to answer the following question: Is the capacity of current models strong enough for document-level translation? Interestingly, we observe that the original Transformer with appropriate training techniques can achieve strong results for document translation, even with a length of 2000 words. We evaluate this model and several recent approaches on nine document-level datasets and two sentence-level datasets across six languages. Experiments show that document-level Transformer models outperforms sentence-level ones and many previous methods in a comprehensive set of metrics, including BLEU, four lexical indices, three newly proposed assistant linguistic indicators, and human evaluation. 2022.findings-acl.279 @@ -4226,7 +4226,7 @@ ZhongqiaoLi XinboZhang ChangzhiSun - LeiLi + LeiLi YanghuaXiao HaoZhou 3941-3955 @@ -4371,7 +4371,7 @@ Structural Supervision for Word Alignment and Machine Translation - LeiLi + LeiLi KaiFan HongjiaLi ChunYuan @@ -6196,7 +6196,7 @@ Good Visual Guidance Make A Better Extractor: Hierarchical Visual Prefix for Multimodal Entity and Relation Extraction XiangChen NingyuZhang - LeiLi + LeiLi YunzhiYao ShuminDeng ChuanqiTan @@ -7198,7 +7198,7 @@ JingjingXu JiazeChen HaoZhou - LeiLi + LeiLi 2508-2527 We introduce MTG, a new benchmark suite for training and evaluating multilingual text generation. It is the first-proposed multilingual multiway text generation dataset with the largest human-annotated data (400k). It includes four generation tasks (story generation, question generation, title generation and text summarization) across five languages (English, German, French, Spanish and Chinese). The multiway setup enables testing knowledge transfer capabilities for a model across languages and tasks. Using MTG, we train and analyze several popular multilingual generation models from different aspects. Our benchmark suite fosters model performance enhancement with more human-annotated parallel data. It provides comprehensive evaluations with diverse generation scenarios. Code and data are available at https://github.com/zide05/MTG. 
2022.findings-naacl.192 @@ -8908,7 +8908,7 @@ TingtingLiuEast China Normal University ChengyuWangAlibaba Group XiangruZhuFudan University - LeiLiEast China Normal University + LeiLiEast China Normal University MinghuiQiuAlibaba Group JunHuangalibaba group MingGaoEast China Normal University @@ -11942,7 +11942,7 @@ Faster and Smaller Speech Translation without Quality Compromise SiyiWangBeijing University of Posts and Telecommunications KaiWangBeijing University of Posts and Telecommunications YanquanZhouBeijing University of Posts and Telecommunications - LeiLiBeijing University of Posts and Telecommunications + LeiLiBeijing University of Posts and Telecommunications QingYangDu Xiaoman Technology(Beijing) DongliangXuDu Xiaoman Technology(Beijing) 3880-3886 @@ -13046,7 +13046,7 @@ Faster and Smaller Speech Translation without Quality Compromise Distillation-Resistant Watermarking for Model Protection in <fixed-case>NLP</fixed-case> XuandongZhaoUC Santa Barbara - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara Yu-XiangWangUCSB 5044-5055 How can we protect the intellectual property of trained NLP models? Modern NLP models are prone to stealing by querying and distilling from their publicly exposed APIs. However, existing protection methods such as watermarking only work for images but are not applicable to text. We propose Distillation-Resistant Watermarking (DRW), a novel technique to protect NLP models from being stolen via distillation. DRW protects a model by injecting watermarks into the victim’s prediction probability corresponding to a secret key and is able to detect such a key by probing a suspect model. We prove that a protected model still retains the original accuracy within a certain bound. We evaluate DRW on a diverse set of NLP tasks including text classification, part-of-speech tagging, and named entity recognition. Experiments show that DRW protects the original model and detects stealing suspects at 100% mean average precision for all four tasks while the prior method fails on two. @@ -13946,7 +13946,7 @@ Faster and Smaller Speech Translation without Quality Compromise YifanSongPeking University JingjingXuShanghai AI Lab ZhifangSuiPeking University - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara 5937-5947 Previous literature has proved that Pretrained Language Models (PLMs) can store factual knowledge. However, we find that facts stored in the PLMs are not always correct. It motivates us to explore a fundamental question: How do we calibrate factual knowledge in PLMs without re-training from scratch? In this work, we propose a simple and lightweight method CaliNet to achieve this goal. To be specific, we first detect whether PLMs can learn the right facts via a contrastive score between right and fake facts. If not, we then use a lightweight method to add and adapt new parameters to specific factual texts. Experiments on the knowledge probing task show the calibration effectiveness and efficiency. In addition, through closed-book question answering, we find that the calibrated PLM possesses knowledge generalization ability after finetuning.Beyond the calibration performance, we further investigate and visualize the knowledge calibration mechanism. 
2022.findings-emnlp.438 @@ -14453,7 +14453,7 @@ Faster and Smaller Speech Translation without Quality Compromise From Mimicking to Integrating: Knowledge Integration for Pre-Trained Language Models - LeiLiPeking University + LeiLiPeking University YankaiLinGaoling School of Artificial Intelligence, Renmin University of China XuanchengRenPeking University GuangxiangZhaoPeking University @@ -14613,7 +14613,7 @@ Faster and Smaller Speech Translation without Quality Compromise Yi-LinTuanUniversity of California, Santa Barbara YujieLuUniversity of California, Santa Barbara MichaelSaxonUniversity of California, Santa Barbara - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara William YangWangUnversity of California, Santa Barbara 6559-6574 Is it possible to build a general and automatic natural language generation (NLG) evaluation metric? Existing learned metrics either perform unsatisfactorily or are restricted to tasks where large human rating data is already available. We introduce SESCORE, a model-based metric that is highly correlated with human judgements without requiring human annotation, by utilizing a novel, iterative error synthesis and severity scoring pipeline. This pipeline applies a series of plausible errors to raw text and assigns severity labels by simulating human judgements with entailment. We evaluate SESCORE against existing metrics by comparing how their scores correlate with human ratings. SESCORE outperforms all prior unsupervised metrics on multiple diverse NLG tasks including machine translation, image captioning, and WebNLG text generation. For WMT 20/21En-De and Zh-En, SESCORE improve the average Kendall correlation with human judgement from 0.154 to 0.195. SESCORE even achieves comparable performance to the best supervised metric COMET, despite receiving no human annotated training data. diff --git a/data/xml/2022.iwslt.xml b/data/xml/2022.iwslt.xml index 07610a69ea..3525f423fa 100644 --- a/data/xml/2022.iwslt.xml +++ b/data/xml/2022.iwslt.xml @@ -112,7 +112,7 @@ On the Impact of Noises in Crowd-Sourced Data for Speech Translation SiqiOuyang RongYe - LeiLi + LeiLi 92-97 Training speech translation (ST) models requires large and high-quality datasets. MuST-C is one of the most widely used ST benchmark datasets. It contains around 400 hours of speech-transcript-translation data for each of the eight translation directions. This dataset passes several quality-control filters during creation. However, we find that MuST-C still suffers from three major quality issues: audiotext misalignment, inaccurate translation, and unnecessary speaker’s name. What are the impacts of these data quality issues for model development and evaluation? In this paper, we propose an automatic method to fix or filter the above quality issues, using English-German (En-De) translation as an example. Our experiments show that ST models perform better on clean test sets, and the rank of proposed models remains consistent across different test sets. Besides, simply removing misaligned data points from the training set does not lead to a better ST model. 2022.iwslt-1.9 diff --git a/data/xml/2022.naacl.xml b/data/xml/2022.naacl.xml index e51dd12cb9..6c56c243dc 100644 --- a/data/xml/2022.naacl.xml +++ b/data/xml/2022.naacl.xml @@ -973,7 +973,7 @@ Provably Confidential Language Modelling XuandongZhao - LeiLi + LeiLi Yu-XiangWang 943-955 Large language models are shown to memorize privacy information such as social security numbers in training data. 
Given the sheer scale of the training corpus, it is challenging to screen and filter these privacy data, either manually or automatically. In this paper, we propose Confidentially Redacted Training (CRT), a method to train language generation models while protecting the confidential segments. We borrow ideas from differential privacy (which solves a related but distinct problem) and show that our method is able to provably prevent unintended memorization by randomizing parts of the training process. Moreover, we show that redaction with an approximately correct screening policy amplifies the confidentiality guarantee. We implement the method for both LSTM and GPT language models. Our experimental results show that the models trained by CRT obtain almost the same perplexity while preserving strong confidentiality. @@ -5242,7 +5242,7 @@ Cross-modal Contrastive Learning for Speech Translation RongYe MingxuanWang - LeiLi + LeiLi 5099-5113 How can we learn unified representations for spoken utterances and their written text? Learning similar representations for semantically similar speech and text is important for speech translation. To this end, we propose ConST, a cross-modal contrastive learning method for end-to-end speech-to-text translation. We evaluate ConST and a variety of previous baselines on a popular benchmark MuST-C. Experiments show that the proposed ConST consistently outperforms the previous methods, and achieves an average BLEU of 29.4. The analysis further verifies that ConST indeed closes the representation gap of different modalities — its learned representation improves the accuracy of cross-modal speech-text retrieval from 4% to 88%. Code and models are available at https://github.com/ReneeYe/ConST. 2022.naacl-main.376 diff --git a/data/xml/2023.acl.xml b/data/xml/2023.acl.xml index 0137f0c46e..e0dcf75007 100644 --- a/data/xml/2023.acl.xml +++ b/data/xml/2023.acl.xml @@ -3036,7 +3036,7 @@ <fixed-case>WACO</fixed-case>: Word-Aligned Contrastive Learning for Speech Translation SiqiOuyangUniversity of California, Santa Barbara RongYeByteDance AI Lab - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara 3891-3907 End-to-end Speech Translation (E2E ST) aims to directly translate source speech into target text. Existing ST methods perform poorly when only extremely small speech-text data are available for training. We observe that an ST model’s performance closely correlates with its embedding similarity between speech and source transcript. In this paper, we propose Word-Aligned COntrastive learning (WACO), a simple and effective method for extremely low-resource speech-to-text translation. Our key idea is bridging word-level representations for both speech and text modalities via contrastive learning. We evaluate WACO and other methods on the MuST-C dataset, a widely used ST benchmark, and on a low-resource direction Maltese-English from IWSLT 2023. Our experiments demonstrate that WACO outperforms the best baseline by 9+ BLEU points with only 1-hour parallel ST data. Code is available at https://github.com/owaski/WACO. 2023.acl-long.216 @@ -4007,7 +4007,7 @@ WendaXuUniversity of California at Santa Barbara XianQianByteDance AI LAB MingxuanWangBytedance AI Lab - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara William YangWangUnversity of California, Santa Barbara 5166-5183 Is it possible to train a general metric for evaluating text generation quality without human-annotated ratings? 
Existing learned metrics either perform unsatisfactory across text generation tasks or require human ratings for training on specific tasks. In this paper, we propose SEScore2, a self-supervised approach for training a model-based metric for text generation evaluation. The key concept is to synthesize realistic model mistakes by perturbing sentences retrieved from a corpus. We evaluate SEScore2 and previous methods on four text generation tasks across three languages. SEScore2 outperforms all prior unsupervised metrics on four text generation evaluation benchmarks, with an average Kendall improvement of 0.158. Surprisingly, SEScore2 even outperforms the supervised BLEURT and COMET on multiple text generation tasks. @@ -7899,7 +7899,7 @@ WeiShiFudan University ZiquanFuSystem, Inc SijieChengFudan University - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara YanghuaXiaoFudan University 9890-9908 Large language models (LLMs) have been widely studied for their ability to store and utilize positive knowledge. However, negative knowledge, such as “lions don’t live in the ocean”, is also ubiquitous in the world but rarely mentioned explicitly in text. What do LLMs know about negative knowledge?This work examines the ability of LLMs on negative commonsense knowledge. We design a constrained keywords-to-sentence generation task (CG) and a Boolean question answering task (QA) to probe LLMs.Our experiments reveal that LLMs frequently fail to generate valid sentences grounded in negative commonsense knowledge, yet they can correctly answer polar yes-or-no questions. We term this phenomenon the belief conflict of LLMs.Our further analysis shows that statistical shortcuts and negation reporting bias from language modeling pre-training cause this conflict. @@ -12505,7 +12505,7 @@ SiqiOuyangUniversity of California, Santa Barbara ZhiguoYuMicrosoft MingWuGitHub, Inc. - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara 15590-15606 How can we extend a pre-trained model to many language understanding tasks, without labeled or additional unlabeled data? Pre-trained language models (PLMs) have been effective for a wide range of NLP tasks. However, existing approaches either require fine-tuning on downstream labeled datasets or manually constructing proper prompts. In this paper, we propose nonparametric prompting PLM (NPPrompt) for fully zero-shot language understanding. Unlike previous methods, NPPrompt uses only pre-trained language models and does not require any labeled data or additional raw corpus for further fine-tuning, nor does it rely on humans to construct a comprehensive set of prompt label words. We evaluate NPPrompt against previous major few-shot and zero-shot learning methods on diverse NLP tasks: including text classification, text entailment, similar text retrieval, paraphrasing, and multiple-choice question answering. Experimental results demonstrate that our NPPrompt outperforms the previous best fully zero-shot method by big margins, with absolute gains of 12.8% in accuracy on text classification and 15.6% on the GLUE benchmark. Our source code is available at https://anonymous.4open.science/r/NPPrompt. 
2023.acl-long.869 @@ -16901,7 +16901,7 @@ <fixed-case>F</fixed-case>ashion<fixed-case>KLIP</fixed-case>: Enhancing <fixed-case>E</fixed-case>-Commerce Image-Text Retrieval with Fashion Multi-Modal Conceptual Knowledge Graph XiaodanWangFudan University ChengyuWangAlibaba Group - LeiLiEast China Normal University + LeiLiEast China Normal University ZhixuLiFudan University BenChenAlibaba Group LinboJinAlibaba diff --git a/data/xml/2023.americasnlp.xml b/data/xml/2023.americasnlp.xml index 2a7fc31a22..5f13fb31f4 100644 --- a/data/xml/2023.americasnlp.xml +++ b/data/xml/2023.americasnlp.xml @@ -230,7 +230,7 @@ TianruiGuUniversity of California, Santa Barbara KaieChenUniversity of California, Santa Barbara SiqiOuyangUniversity of California, Santa Barbara - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara 173-176 This paper presents PlayGround’s submission to the AmericasNLP 2023 shared task on machine translation (MT) into indigenous languages. We finetuned NLLB-600M, a multilingual MT model pre-trained on Flores-200, on 10 low-resource language directions and examined the effectiveness of weight averaging and back translation. Our experiments showed that weight averaging, on average, led to a 0.0169 improvement in the ChrF++ score. Additionally, we found that back translation resulted in a 0.008 improvement in the ChrF++ score. 2023.americasnlp-1.19 diff --git a/data/xml/2023.emnlp.xml b/data/xml/2023.emnlp.xml index b333e00563..ee7dd7e37b 100644 --- a/data/xml/2023.emnlp.xml +++ b/data/xml/2023.emnlp.xml @@ -4156,7 +4156,7 @@ Can We Edit Factual Knowledge by In-Context Learning? CeZheng - LeiLi + LeiLi QingxiuDong YuxuanFan ZhiyongWu @@ -5132,7 +5132,7 @@ ZhenqiaoSong MarkusFreitag WilliamWang - LeiLi + LeiLi 5967-5994 Automatically evaluating the quality of language generation is critical. Although recent learned metrics show high correlation with human judgement, these metrics do not provide explicit explanation of their verdict, nor associate the scores with defects in the generated text. To address this limitation, we present INSTRUCTSCORE, a fine-grained explainable evaluation metric for text generation. By harnessing both explicit human instruction and the implicit knowledge of GPT-4, we fine-tune a text evaluation metric based on LLaMA, producing both a score for generated text and a human readable diagnostic report. We evaluate INSTRUCTSCORE on a variety of generation tasks, including translation, captioning, data-to-text, and commonsense generation. Experiments show that our 7B model surpasses all other unsupervised metrics, including those based on 175B GPT-3 and GPT-4. Surprisingly, our INSTRUCTSCORE, even without direct supervision from human-rated data, achieves performance levels on par with state-of-the-art metrics like COMET22, which were fine-tuned on human ratings. 2023.emnlp-main.365 @@ -8511,7 +8511,7 @@ Label Words are Anchors: An Information Flow Perspective for Understanding In-Context Learning LeanWang - LeiLi + LeiLi DamaiDai DeliChen HaoZhou @@ -9223,7 +9223,7 @@ Learning from Mistakes via Cooperative Study Assistant for Large Language Models DanqingWang - LeiLi + LeiLi 10667-10685 Large language models (LLMs) have demonstrated their potential to refine their generation based on their own feedback. However, the feedback from LLM itself is often inaccurate, thereby limiting its benefits. 
In this paper, we propose Study Assistant for Large LAnguage Model (SALAM), a novel framework with an auxiliary agent to assist the main LLM in learning from mistakes through interactive cooperation. In the gathering phase, the student assistant agent probes the main LLM, analyzes its errors, and collects the interaction in a mistake memory. During the examination phase, the study assistant provides guidelines by retrieving relevant cases to help the main LLM anticipate and avoid similar errors. We first investigate the effectiveness of a general study assistant and then customize it to provide LLM-specific guidance through imitation learning from successful guidance experiences. Our experiments on three LLMs using two challenging frameworks demonstrate that SALAM can significantly boost LLMs by an accuracy margin of up to 6.6 on BBH and 12.6 on BBQ. 2023.emnlp-main.659 @@ -10152,7 +10152,7 @@ Can Language Models Understand Physical Concepts? - LeiLi + LeiLi JingjingXu QingxiuDong CeZheng diff --git a/data/xml/2023.findings.xml b/data/xml/2023.findings.xml index c14c5e0829..b5af6bc1be 100644 --- a/data/xml/2023.findings.xml +++ b/data/xml/2023.findings.xml @@ -4664,7 +4664,7 @@ YongkangWuHuawei MengHanHuawei YutaoZhuUniversity of Montreal - LeiLiHuawei + LeiLiHuawei XinyuZhangHuawei Technologies Co., Ltd RuofeiLaiHuawei XiaoguangLiHuawei Noah’s Ark Lab @@ -7044,7 +7044,7 @@ Communication Efficient Federated Learning for Multilingual Neural Machine Translation with Adapter YiLiuSchool of Computer Science, Peking University XiaohanBiPeking University - LeiLiPeking University + LeiLiPeking University SishuoChenCenter for Data Science, Peking University WenkaiYangPeking University XuSunPeking University @@ -7617,7 +7617,7 @@ <fixed-case>LET</fixed-case>: Leveraging Error Type Information for Grammatical Error Correction LingyuYangTsinghua University HongjiaLiTsinghua University - LeiLiTsinghua University + LeiLiTsinghua University ChengyinXuTsinghua University ShutaoXiaTsinghua University ChunYuanTsinghua University @@ -10714,7 +10714,7 @@ Delving into the Openness of <fixed-case>CLIP</fixed-case> ShuhuaiRenPeking University - LeiLiPeking University + LeiLiPeking University XuanchengRenDAMO Academy, Alibaba Group GuangxiangZhaoShanghai AI lab XuSunPeking University @@ -12344,7 +12344,7 @@ YinquanLuShanghai AI Laboratory WenhaoZhuNational Key Laboratory for Novel Software Technology, Nanjing University LingpengKongThe University of Hong Kong - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara YuQiaoShanghai AI Lab JingjingXuShanghai AI Lab 11518-11533 @@ -16398,7 +16398,7 @@ <fixed-case>I</fixed-case>mage<fixed-case>N</fixed-case>et<fixed-case>VC</fixed-case>: Zero- and Few-Shot Visual Commonsense Evaluation on 1000 <fixed-case>I</fixed-case>mage<fixed-case>N</fixed-case>et Categories HemingXia QingxiuDong - LeiLi + LeiLi JingjingXu TianyuLiu ZiweiQin @@ -17331,7 +17331,7 @@ <fixed-case>A</fixed-case>uto<fixed-case>P</fixed-case>lan: Automatic Planning of Interactive Decision-Making Tasks With Large Language Models SiqiOuyang - LeiLi + LeiLi 3114-3128 Recent large language models (LLMs) are promising for making decisions in grounded environments. However, LLMs frequently fail in complex decision-making tasks due to the misalignment between the pre-trained knowledge in LLMs and the actual rules in the environment. Existing methods require either costly gradient computation or lengthy in-context demonstrations. 
In this paper, we propose AutoPlan, an approach to guide LLM-based agents to accomplish interactive decision-making tasks. AutoPlan augments the LLM prompt with a task-solving plan and optimizes it through iterative experience collection and reflection. Our experiments show that AutoPlan, though using no in-context demonstrations, achieves success rates on par with the baselines using human-written demonstrations on ALFWorld and even outperforms them by 8% on HotpotQA. The code is available at https://github.com/owaski/AutoPlan. 2023.findings-emnlp.205 @@ -28056,7 +28056,7 @@ BohongWu FeiYuan HaiZhao - LeiLi + LeiLi JingjingXu 15432-15444 Multilingual understanding models (or encoder-based), pre-trained via masked language modeling, have achieved promising results on many language understanding tasks (e.g., mBERT). However, these models are not capable of generating high-quality text compared with decoder-based causal language models. Can we transform a pre-trained language understanding model into an effective language generation model? We propose a Semantic-Guided Alignment-then-Denoising (SGA) approach to adapt a multilingual encoder to a multilingual generator with a small number of additional parameters. Experiments show that the proposed approach is an effective adaption method, outperforming widely-used initialization-based methods with gains of 9.4 BLEU on machine translation, 8.1 Rouge-L on question generation, and 5.5 METEOR on story generation on XLM-R_{large}. On the other hand, we observe that XLM-R is still inferior to mBART in supervised settings despite better results on zero-shot settings, indicating that more exploration is required to make understanding models strong generators. Our code is available at https://github.com/chengzhipanpan/XLMR4MT. diff --git a/data/xml/2023.ijcnlp.xml b/data/xml/2023.ijcnlp.xml index 8a6f4f1f91..292a8d1274 100644 --- a/data/xml/2023.ijcnlp.xml +++ b/data/xml/2023.ijcnlp.xml @@ -1496,7 +1496,7 @@ PengfeiZhu ChaoPang YekunChai - LeiLi + LeiLi ShuohuanWang YuSun HaoTian diff --git a/data/xml/2024.acl.xml b/data/xml/2024.acl.xml index 6a03746558..0a00862971 100644 --- a/data/xml/2024.acl.xml +++ b/data/xml/2024.acl.xml @@ -7079,7 +7079,7 @@ Math-Shepherd: Verify and Reinforce <fixed-case>LLM</fixed-case>s Step-by-step without Human Annotations PeiyiWang - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong ZhihongShaoTsinghua University, Tsinghua University RunxinXu DamaiDai @@ -7096,7 +7096,7 @@ Large Language Models are not Fair Evaluators PeiyiWang - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong LiangChen ZefanCai DaweiZhu @@ -10832,7 +10832,7 @@ Multimodal <fixed-case>A</fixed-case>r<fixed-case>X</fixed-case>iv: A Dataset for Improving Scientific Comprehension of Large Vision-Language Models - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong YuqiWangUniversity of Hong Kong RunxinXuPeking University PeiyiWangPeking University @@ -11575,7 +11575,7 @@ GuangleiZhuCarnegie Mellon University XuandongZhaoUniversity of California, Berkeley LiangmingPanUniversity of California, Santa Barbara - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University WilliamWangUC Santa Barbara 15474-15492 Recent studies show that large language models (LLMs) improve their performance through self-feedback on certain tasks while degrade on others. We discovered that such a contrary is due to LLM’s bias in evaluating their own output. 
In this paper, we formally define LLM’s self-bias – the tendency to favor its own generation – using two statistics. We analyze six LLMs (GPT-4, GPT-3.5, Gemini, LLaMA2, Mixtral and DeepSeek) on translation, constrained text generation, and mathematical reasoning tasks. We find that self-bias is prevalent in all examined LLMs across multiple languages and tasks. Our analysis reveals that while the self-refine pipeline improves the fluency and understandability of model outputs, it further amplifies self-bias. To mitigate such biases, we discover that larger model size and external feedback with accurate assessment can significantly reduce bias in the self-refine pipeline, leading to actual performance improvement in downstream tasks. The code and data are released at https://github.com/xu1998hz/llm_self_bias. @@ -13381,7 +13381,7 @@ ZiwenXuZhejiang University ShuofeiQiao RunnanFang - LeiLiTencent + LeiLiTencent ZhenBiZhejiang University GuozhouZheng HuajunChenZhejiang University @@ -14422,7 +14422,7 @@ Watermarking for Large Language Models XuandongZhao Yu-XiangWang - LeiLi + LeiLi 10-11 As AI-generated text increasingly resembles human-written content, the ability to detect machine-generated text becomes crucial in both the computational linguistics and machine learning communities. In this tutorial, we aim to provide an in-depth exploration of text watermarking, a subfield of linguistic steganography with the goal of embedding a hidden message (the watermark) within a text passage. We will introduce the fundamentals of text watermarking, discuss the main challenges in identifying AI-generated text, and delve into the current watermarking methods, assessing their strengths and weaknesses. Moreover, we will explore other possible applications of text watermarking and discuss future directions for this field. Each section will be supplemented with examples and key takeaways. 2024.acl-tutorials.6 diff --git a/data/xml/2024.ccl.xml b/data/xml/2024.ccl.xml index af96f82500..44aa040fb4 100644 --- a/data/xml/2024.ccl.xml +++ b/data/xml/2024.ccl.xml @@ -1070,7 +1070,7 @@ YuelouXu YanLu KaiWang - LeiLi + LeiLi YanquanZhou 1123–1135 “The zero-resource cross-domain named entity recognition (NER) task aims to perform NER in aspecific domain where labeled data is unavailable. Existing methods primarily focus on transfer-ring NER knowledge from high-resource to zero-resource domains. However, the challenge liesin effectively transferring NER knowledge between domains due to the inherent differences inentity structures across domains. To tackle this challenge, we propose an Unsupervised DomainAdaptation Adversarial (UDAA) framework, which combines the masked language model auxil-iary task with the domain adaptive adversarial network to mitigate inter-domain differences andefficiently facilitate knowledge transfer. Experimental results on CBS, Twitter, and WNUT2016three datasets demonstrate the effectiveness of our framework. Notably, we achieved new state-of-the-art performance on the three datasets. 
Our code will be released.Introduction” diff --git a/data/xml/2024.emnlp.xml b/data/xml/2024.emnlp.xml index b36fd0d2d0..b71bb6a0e9 100644 --- a/data/xml/2024.emnlp.xml +++ b/data/xml/2024.emnlp.xml @@ -902,7 +902,7 @@ A Survey on In-context Learning QingxiuDong - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong DamaiDai CeZhengPeking University JingyuanMa @@ -912,7 +912,7 @@ ZhiyongWuShanghai Artificial Intelligence Laboratory BaobaoChangPeking University XuSun - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University ZhifangSuiPeking University 1107-1128 With the increasing capabilities of large language models (LLMs), in-context learning (ICL) has emerged as a new paradigm for natural language processing (NLP), where LLMs make predictions based on contexts augmented with a few examples. It has been a significant trend to explore ICL to evaluate and extrapolate the ability of LLMs. In this paper, we aim to survey and summarize the progress and challenges of ICL. We first present a formal definition of ICL and clarify its correlation to related studies. Then, we organize and discuss advanced techniques, including training strategies, prompt designing strategies, and related analysis. Additionally, we explore various ICL application scenarios, such as data engineering and knowledge updating. Finally, we address the challenges of ICL and suggest potential directions for further research. We hope that our work can encourage more research on uncovering how ICL works and improving ICL. @@ -5036,7 +5036,7 @@ <fixed-case>VLF</fixed-case>eedback: A Large-Scale <fixed-case>AI</fixed-case> Feedback Dataset for Large Vision-Language Models Alignment - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong ZhihuiXieShanghai Jiao Tong University MukaiLi ShunianChenShenzhen Research Institute of Big Data @@ -8701,7 +8701,7 @@ WendaXu JiachenLiUniversity of California, Santa Barbara William YangWangUC Santa Barbara - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 11125-11139 Direct alignment from preferences (DAP) has emerged as a promising paradigm for aligning large language models (LLMs) to human desiderata from pre-collected, offline preference datasets. While recent studies indicate that existing offline DAP methods can directly benefit from online training samples, we highlight the need to develop specific online DAP algorithms to fully harness the power of online training. Specifically, we identify that the learned LLM should adhere to the proximity of the behavior LLM, which collects the training samples. To this end, we propose online Preference Optimization in proximity to the Behavior LLM (BPO), emphasizing the importance of constructing a proper trust region for LLM alignment.We conduct extensive experiments to validate the effectiveness and applicability of our approach by integrating it with various DAP methods, resulting in significant performance improvements across a wide range of tasks when training with the same amount of preference data. Even when only introducing one additional data collection phase, our online BPO improves its offline DAP baseline from 72.0% to 80.2% on TL;DR and from 82.2% to 89.1% on Anthropic Helpfulness in terms of win rate against human reference text. 
2024.emnlp-main.623 @@ -10250,7 +10250,7 @@ HanlinZhuElectrical Engineering & Computer Science Department, University of California Berkeley XiaomengYangGoogle DeepMind AndrewCohen - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University YuandongTianMeta AI (FAIR) 13274-13292 Recent research has increasingly focused on evaluating large language models’ (LLMs) alignment with diverse human values and preferences, particularly for open-ended tasks like story generation. Traditional evaluation metrics rely heavily on lexical similarity with human-written references, often showing poor correlation with human judgments and failing to account for alignment with the diversity of human preferences. To address these challenges, we introduce PerSE, an interpretable evaluation framework designed to assess alignment with specific human preferences. It is tuned to infer specific preferences from an in-context personal profile and evaluate the alignment between the generated content and personal preferences. PerSE enhances interpretability by providing detailed comments and fine-grained scoring, facilitating more personalized content generation. Our 13B LLaMA-2-based PerSE shows a 15.8% increase in Kendall correlation and a 13.7% rise in accuracy with zero-shot reviewers compared to GPT-4. It also outperforms GPT-4 by 46.01% in Kendall correlation on new domains, indicating its transferability @@ -18075,7 +18075,7 @@ WendaXu XiXu SiqiOuyangCMU, Carnegie Mellon University - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 344-350 With the rapid advancement of machine translation research, evaluation toolkits have become essential for benchmarking system progress. Tools like COMET and SacreBLEU offer single quality score assessments that are effective for pairwise system comparisons. However, these tools provide limited insights for fine-grained system-level comparisons and the analysis of instance-level defects. To address these limitations, we introduce Translation Canvas, an explainable interface designed to pinpoint and analyze translation systems’ performance: 1) Translation Canvas assists machine translation researchers in comprehending system-level model performance by identifying common errors (their frequency and severity) and analyzing relationships between different systems based on various evaluation metrics. 2) It supports fine-grained analysis by highlighting error spans with explanations and selectively displaying systems’ predictions. According to human evaluation, Translation Canvas demonstrates superior performance over COMET and SacreBLEU packages under enjoybility and understandbility criteria. 2024.emnlp-demo.36 diff --git a/data/xml/2024.findings.xml b/data/xml/2024.findings.xml index 3892c3c698..52ad9d01e8 100644 --- a/data/xml/2024.findings.xml +++ b/data/xml/2024.findings.xml @@ -3228,7 +3228,7 @@ BiaoZhangGoogle DeepMind ZhongtaoLiuGoogle William YangWangUC Santa Barbara - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University MarkusFreitagGoogle 1429-1445 Recent large language models (LLM) areleveraging human feedback to improve theirgeneration quality. However, human feedbackis costly to obtain, especially during inference.In this work, we propose LLMRefine, aninference time optimization method to refineLLM’s output. 
The core idea is to usea learned fine-grained feedback model topinpoint defects and guide LLM to refinethem iteratively. Using original LLM as aproposal of edits, LLMRefine searches fordefect-less text via simulated annealing, tradingoff the exploration and exploitation. Weconduct experiments on three text generationtasks, including machine translation, long-form question answering (QA), and topicalsummarization. LLMRefine consistentlyoutperforms all baseline approaches, achievingimprovements up to 1.7 MetricX points ontranslation tasks, 8.1 ROUGE-L on ASQA, 2.2ROUGE-L on topical summarization. @@ -4399,7 +4399,7 @@ ShujianHuangNanjing University LingpengKongDepartment of Computer Science, The University of Hong Kong JiajunChenNanjing University - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 2765-2781 Large language models (LLMs) have demonstrated remarkable potential in handling multilingual machine translation (MMT). In this paper, we systematically investigate the advantages and challenges of LLMs for MMT by answering two questions: 1) How well do LLMs perform in translating massive languages? 2) Which factors affect LLMs’ performance in translation? We thoroughly evaluate eight popular LLMs, including ChatGPT and GPT-4. Our empirical results show that translation capabilities of LLMs are continually involving. GPT-4 has beat the strong supervised baseline NLLB in 40.91% of translation directions but still faces a large gap towards the commercial translation system like Google Translate, especially on low-resource languages. Through further analysis, we discover that LLMs exhibit new working patterns when used for MMT. First, LLM can acquire translation ability in a resource-efficient way and generate moderate translation even on zero-resource languages. Second, instruction semantics can surprisingly be ignored when given in-context exemplars. Third, cross-lingual exemplars can provide better task guidance for low-resource translation than exemplars in the same language pairs. Code will be released at: https://github.com/NJUNLP/MMT-LLM. 2024.findings-naacl.176 @@ -8815,7 +8815,7 @@ Red Teaming Visual Language Models MukaiLi - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong YuweiYin MasoodAhmed ZhenguangLiuZhejiang University @@ -13143,7 +13143,7 @@ YiLiuPeking University YuxiangWang ShuhuaiRen - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong SishuoChenAlibaba Group XuSun LuHouHuawei Technologies Ltd. @@ -15929,7 +15929,7 @@ FeiYuan ShuaiYuan ZhiyongWuShanghai Artificial Intelligence Laboratory - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 12111-12130 Large Language Models (LLMs), often show strong performance on English tasks, while exhibiting limitations on other languages. What is an LLM’s multilingual capability when it is trained only on certain languages? The underlying mechanism remains unclear. This study endeavors to examine the multilingual capability of LLMs from the vocabulary sharing perspective by conducting an exhaustive analysis across 101 languages. Through the investigation of the performance gap before and after embedding fine-tuning, we discovered four distinct quadrants. By delving into each quadrant we provide actionable and efficient guidelines for tuning these languages. 
Extensive experiments reveal that existing LLMs possess multilingual capabilities that surpass our expectations, and we can significantly improve the multilingual performance of LLMs based on these attributes of each quadrant . 2024.findings-acl.721 @@ -18707,7 +18707,7 @@ ZhenqiaoSong TaiqiHe William YangWangUC Santa Barbara - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 15654-15669 How can large language models (LLMs) process and translate endangered languages? Many languages lack a large corpus to train a decent LLM; therefore existing LLMs rarely perform well in unseen, endangered languages. On the contrary, we observe that 2000 endangered languages, though without a large corpus, have a grammar book or a dictionary. We propose LingoLLM, a training-free approach to enable an LLM to process unseen languages that hardly occur in its pre-training. Our key insight is to demonstrate linguistic knowledge of an unseen language in an LLM’s prompt, including a dictionary, a grammar book, and morphologically analyzed input text. We implement LingoLLM on top of two models, GPT-4 and Mixtral, and evaluate their performance on 5 tasks across 8 endangered or low-resource languages. Our results show that LingoLLM elevates translation capability from GPT-4’s 0 to 10.5 BLEU for 10 language directions. Our findings demonstrate the tremendous value of linguistic knowledge in the age of LLMs for endangered languages. Our data, code, and model generations will be released to the public. Our data, code, and model generations can be found at https://github.com/LLiLab/llm4endangeredlang. 2024.findings-acl.925 @@ -19577,7 +19577,7 @@ BabakDamavandi Xin LunaDongFacebook ChristosFaloutsosAmazon and Carnegie Mellon University - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University SeungwhanMoonFacebook 247-266 Vision-extended LLMs have made significant strides in Visual Question Answering (VQA). Despite these advancements, VLLMs still encounter substantial difficulties in handling queries involving long-tail entities, with a tendency to produce erroneous or hallucinated responses. In this work, we introduce a novel evaluative benchmark named SnapNTell, specifically tailored for entity-centric VQA. This task aims to test the models’ capabilities in identifying entities and providing detailed, entity-specific knowledge. We have developed the SnapNTell Dataset, distinct from traditional VQA datasets: (1) It encompasses a wide range of categorized entities, each represented by images and explicitly named in the answers; (2) It features QA pairs that require extensive knowledge for accurate responses. The dataset is organized into 22 major categories, containing 7,568 unique entities in total. For each entity, we curated 10 illustrative images and crafted 10 knowledge-intensive QA pairs. To address this novel task, we devised a scalable, efficient, and transparent retrieval-augmented multimodal LLM. Our approach markedly outperforms existing methods on the SnapNTell dataset, achieving a 66.5% improvement in the BELURT score. 
@@ -24567,7 +24567,7 @@ and high variation in performance on the subset, suggesting our plausibility cri João DSMarquesInstituto Superior Técnico and INESC-ID MiguelGraça MiguelFreire - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University Arlindo L.Oliveira 6473-6486 Modern NLP tasks increasingly rely on dense retrieval methods to access up-to-date and relevant contextual information. We are motivated by the premise that retrieval benefits from segments that can vary in size such that a content’s semantic independence is better captured. We propose LumberChunker, a method leveraging an LLM to dynamically segment documents, which iteratively prompts the LLM to identify the point within a group of sequential passages where the content begins to shift. To evaluate our method, we introduce GutenQA, a benchmark with 3000 “needle in a haystack” type of question-answer pairs derived from 100 public domain narrative books available on Project Gutenberg. Our experiments show that LumberChunker not only outperforms the most competitive baseline by 7.37% in retrieval performance (DCG@20) but also that, when integrated into a RAG pipeline, LumberChunker proves to be more effective than other chunking methods and competitive baselines, such as the Gemini 1.5M Pro. @@ -28060,7 +28060,7 @@ and high variation in performance on the subset, suggesting our plausibility cri <fixed-case>LL</fixed-case>a<fixed-case>MAX</fixed-case>: Scaling Linguistic Horizons of <fixed-case>LLM</fixed-case> by Enhancing Translation Capabilities Beyond 100 Languages YinquanLuShanghai AI Laboratory WenhaoZhuNanjing University - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University YuQiao FeiYuan 10748-10772 @@ -32433,7 +32433,7 @@ hai-coaching/ <fixed-case>H</fixed-case>yper<fixed-case>L</fixed-case>o<fixed-case>RA</fixed-case>: Efficient Cross-task Generalization via Constrained Low-Rank Adapters Generation ChuanchengLvTsinghua University, Tsinghua University - LeiLiTencent + LeiLiTencent ShitouZhang GangChen FanchaoQi diff --git a/data/xml/2024.iwslt.xml b/data/xml/2024.iwslt.xml index 4384df4c78..a824817398 100644 --- a/data/xml/2024.iwslt.xml +++ b/data/xml/2024.iwslt.xml @@ -328,7 +328,7 @@ BrianYanCarnegie Mellon University PatrickFernandesCarnegie Mellon University WilliamChenCarnegie Mellon University - LeiLiCarnegie Mellon University + LeiLiCarnegie Mellon University GrahamNeubigCarnegie Mellon University ShinjiWatanabeCarnegie Mellon University 154-159 @@ -366,7 +366,7 @@ SiqiOuyangCarnegie Mellon University WilliamChenCarnegie Mellon University KarenLivescuTTI-Chicago - LeiLiCarnegie Mellon University + LeiLiCarnegie Mellon University GrahamNeubigCarnegie Mellon University ShinjiWatanabeCarnegie Mellon University 164-169 diff --git a/data/xml/2024.lrec.xml b/data/xml/2024.lrec.xml index 94b70df131..2b6c32c612 100644 --- a/data/xml/2024.lrec.xml +++ b/data/xml/2024.lrec.xml @@ -9082,7 +9082,7 @@ QingYang DongliangXu YanquanZhou - LeiLi + LeiLi YuzeLi YingqiZhu 8792–8803 @@ -10424,7 +10424,7 @@ Large Language Models for Generative Recommendation: A Survey and Visionary Discussions - LeiLi + LeiLi YongfengZhang DugangLiu LiChen diff --git a/data/xml/2024.naacl.xml b/data/xml/2024.naacl.xml index 4f3494d646..134e936cfb 100644 --- a/data/xml/2024.naacl.xml +++ b/data/xml/2024.naacl.xml @@ -8700,7 +8700,7 @@ MuhaoChenUC Davis ChaoweiXiaoUW-Madison HuanSunOSU - LeiLiCMU + LeiLiCMU 
LeonDerczynskiUW Seattle AnimaAnandkumarCaltech, NVIDIA FeiWangUSC diff --git a/data/xml/2025.acl.xml b/data/xml/2025.acl.xml index 7e21d6cd67..785a06210b 100644 --- a/data/xml/2025.acl.xml +++ b/data/xml/2025.acl.xml @@ -4615,7 +4615,7 @@ XuandongZhaoUniversity of California, Berkeley ChenwenLiao Yu-XiangWangUniversity of California, San Diego - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 6304-6316 Text watermarks in large language models (LLMs) are increasingly used to detect synthetic text, mitigating misuse cases like fake news and academic dishonesty. While existing watermarking detection techniques primarily focus on classifying entire documents as watermarked or not, they often neglect the common scenario of identifying individual watermark segments within longer, mixed-source documents. Drawing inspiration from plagiarism detection systems, we propose two novel methods for partial watermark detection. First, we develop a geometry cover detection framework aimed at determining whether there is a watermark segment in long text. Second, we introduce an adaptive online learning algorithm to pinpoint the precise location of watermark segments within the text. Evaluated on three popular watermarking techniques (KGW-Watermark, Unigram-Watermark, and Gumbel-Watermark), our approach achieves high accuracy, significantly outperforming baseline methods. Moreover, our framework is adaptable to other watermarking techniques, offering new insights for precise watermark detection. Our code is publicly available at https://github.com/XuandongZhao/llm-watermark-location. 2025.acl-long.316 @@ -11968,7 +11968,7 @@ TianfangZhangTsinghua University ZongkaiWu Jenq-NengHwang - LeiLi + LeiLi 16780-16790 Large Language Models (LLMs) have demonstrated impressive capabilities in reasoning tasks, yet their reliance on static prompt structures and limited adaptability to complex scenarios remains a major challenge. In this paper, we propose the **Deductive and Inductive (DID)** method, a novel framework that enhances LLM reasoning by dynamically integrating both deductive and inductive reasoning approaches. Drawing from cognitive science principles, DID implements a dual-metric complexity evaluation system that combines Littlestone dimension and information entropy to precisely assess task difficulty and guide decomposition strategies. DID enables the model to progressively adapt its reasoning pathways based on problem complexity, mirroring human cognitive processes. We evaluate DID’s effectiveness across multiple benchmarks, including the AIW, MR-GSM8K, and our custom Holiday Puzzle dataset for temporal reasoning. Our results demonstrate great improvements in reasoning quality and solution accuracy - achieving 70.3% accuracy on AIW (compared to 62.2% for Tree of Thought), while maintaining lower computational costs. 
2025.acl-long.820 @@ -17060,7 +17060,7 @@ Uncertainty-Aware Iterative Preference Optimization for Enhanced <fixed-case>LLM</fixed-case> Reasoning - LeiLiTencent + LeiLiTencent HehuanLiu YaxinZhou ZhaoYangGuiTencent @@ -19239,7 +19239,7 @@ Benchmarking Long-Context Language Models on Long Code Understanding JiaLi XuyuanGuoPeking University - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong KechiZhangPeking University GeLiPeking University JiaLiTsinghua University @@ -23304,7 +23304,7 @@ Design Choices for Extending the Context Length of Visual Language Models MukaiLi - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong ShansanGong QiLiuUniversity of Hong Kong 33425-33438 diff --git a/data/xml/2025.coling.xml b/data/xml/2025.coling.xml index 5ff4b44d22..a7ac61845a 100644 --- a/data/xml/2025.coling.xml +++ b/data/xml/2025.coling.xml @@ -6219,7 +6219,7 @@ ZhaojiangLin YuningMao William YangWang - LeiLi + LeiLi Yi-ChiaWang 7819–7830 From ice cream flavors to climate change, people exhibit a wide array of opinions on various topics, and understanding the rationale for these opinions can promote healthy discussion and consensus among them. As such, it can be valuable for a large language model (LLM), particularly as an AI assistant, to be able to empathize with or even explain these various standpoints. In this work, we hypothesize that different topic stances often manifest correlations that can be used to extrapolate to topics with unknown opinions. We explore various prompting and fine-tuning methods to improve an LLM’s ability to (a) extrapolate from opinions on known topics to unknown ones and (b) support their extrapolation with reasoning. Our findings suggest that LLMs possess inherent knowledge from training data about these opinion correlations, and with minimal data, the similarities between human opinions and model-extrapolated opinions can be improved by more than 50%. Furthermore, LLM can generate the reasoning process behind their extrapolation of opinions. diff --git a/data/xml/2025.emnlp.xml b/data/xml/2025.emnlp.xml index 32787a68cc..d91a31816c 100644 --- a/data/xml/2025.emnlp.xml +++ b/data/xml/2025.emnlp.xml @@ -22082,7 +22082,7 @@ ShengWang JingweiDongthe University of Hong Kong KaiLiu - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong JiahuiGao JiyueJiang LingpengKongDepartment of Computer Science, The University of Hong Kong @@ -23892,7 +23892,7 @@ XiaonanLiFudan University MingZhongUniversity of Illinois Urbana Champaign ShansanGong - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong JunZhangByteDance JingjingXu LingpengKongDepartment of Computer Science, The University of Hong Kong @@ -25167,7 +25167,7 @@ AdamOfficerUniversity of Pittsburgh Medical Center AngelaChen YufeiHuangUniversity of Pittsburgh - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 480-486 Comprehensive pathway datasets are essential resources for advancing biological research, yet constructing these datasets is labor intensive. Recognizing the labor-intensive nature of constructing these critical resources, we present BioGraphia, a web-based annotation platform designed to facilitate collaborative pathway graph annotation. BioGraphia supports multi-user collaboration with real-time monitoring, curation, and interactive pathway graph visualization. It enables users to directly annotate the nodes and relations on the candidate graph, guided by detailed instructions. 
The platform is further enhanced with a large language model that automatically generates explainable and span-aligned pre-annotation to accelerate the annotation process. Its modular design allows flexible integration of external knowledge bases, and customization of the definition of annotation schema and, to support adaptation to other graph-based annotation tasks. Code is available at https://github.com/LeiLiLab/BioGraphia 2025.emnlp-demos.34 diff --git a/data/xml/2025.findings.xml b/data/xml/2025.findings.xml index 3c597b3104..4538d945e4 100644 --- a/data/xml/2025.findings.xml +++ b/data/xml/2025.findings.xml @@ -3679,7 +3679,7 @@ A Practical Examination of <fixed-case>AI</fixed-case>-Generated Text Detectors for Large Language Models BrianTufts XuandongZhaoUniversity of California, Berkeley - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 4824-4841 The proliferation of large language models has raised growing concerns about their misuse, particularly in cases where AI-generated text is falsely attributed to human authors. Machine-generated content detectors claim to effectively identify such text under various conditions and from any language model. This paper critically evaluates these claims by assessing several popular detectors (RADAR, Wild, T5Sentinel, Fast-DetectGPT, PHD, LogRank, Binoculars) on a range of domains, datasets, and models that these detectors have not previously encountered. We employ various prompting strategies to simulate practical adversarial attacks, demonstrating that even moderate efforts can significantly evade detection. We emphasize the importance of the true positive rate at a specific false positive rate (TPR@FPR) metric and demonstrate that these detectors perform poorly in certain settings, with TPR@.01 as low as 0%. Our findings suggest that both trained and zero-shot detectors struggle to maintain high sensitivity while achieving a reasonable true positive rate. 2025.findings-naacl.271 @@ -5290,7 +5290,7 @@ XiXu WendaXu SiqiOuyangCMU, Carnegie Mellon University - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 7062-7067 Simultaneous speech translation (SimulST) systems must balance translation quality with response time, making latency measurement crucial for evaluating their real-world performance. However, there has been a longstanding belief that current metrics yield unrealistically high latency measurements in unsegmented streaming settings. In this paper, we investigate this phenomenon, revealing its root cause in a fundamental misconception underlying existing latency evaluation approaches. We demonstrate that this issue affects not only streaming but also segment-level latency evaluation across different metrics. Furthermore, we propose a modification to correctly measure computation-aware latency for SimulST systems, addressing the limitations present in existing metrics. 
2025.findings-naacl.393 @@ -8591,7 +8591,7 @@ <fixed-case>I</fixed-case>nfini<fixed-case>SST</fixed-case>: Simultaneous Translation of Unbounded Speech with Large Language Model SiqiOuyangCMU, Carnegie Mellon University XiXu - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 3032-3046 Simultaneous translation of unbounded streaming speech remains a challenging problem due to the need for effectively processing the historical speech context and past translations so that quality and latency, including computation overhead, can be balanced. Most prior works assume pre-segmented speech, limiting their real-world applicability. In this paper, we propose InfiniSST, a novel approach that formulates SST as a multi-turn dialogue task, enabling seamless translation of unbounded speech. We construct translation trajectories and robust segments from MuST-C with multi-latency augmentation during training and develop a key-value (KV) cache management strategy to facilitate efficient inference. Experiments on MuST-C En-Es, En-De, and En-Zh demonstrate that InfiniSST reduces computation-aware latency by 0.5 to 1 second while maintaining the same translation quality compared to baselines. Ablation studies further validate the contributions of our data construction and cache management strategy. Code is released at https://github.com/LeiLiLab/InfiniSST. 2025.findings-acl.157 @@ -13785,7 +13785,7 @@ ZongkaiWu JohnLeeUniversity of Edinburgh, University of Edinburgh Jenq-NengHwang - LeiLi + LeiLi 10045-10056 In the rapidly evolving field of image generation, achieving precise control over generated content and maintaining semantic consistency remain significant limitations, particularly concerning grounding techniques and the necessity for model fine-tuning. To address these challenges, we propose BayesGenie, an off-the-shelf approach that integrates Large Language Models (LLMs) with Bayesian Optimization to facilitate precise and user-friendly image editing. Our method enables users to modify images through natural language descriptions without manual area marking, while preserving the original image’s semantic integrity. Unlike existing techniques that require extensive pre-training or fine-tuning, our approach demonstrates remarkable adaptability across various LLMs through its model-agnostic design. BayesGenie employs an adapted Bayesian optimization strategy to automatically refine the inference process parameters, achieving high-precision image editing with minimal user intervention. Through extensive experiments across diverse scenarios, we demonstrate that our framework outperforms existing methods in both editing accuracy and semantic preservation, as validated using different LLMs including Claude3 and GPT-4. 2025.findings-acl.523 @@ -23213,7 +23213,7 @@ <fixed-case>L</fixed-case>ego<fixed-case>MT</fixed-case>2: Selective Asynchronous Sharded Data Parallel Training for Massive Neural Machine Translation FeiYuan YinquanLuShanghai AI Laboratory - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University JingjingXu 23359-23376 It is a critical challenge to learn a single model for massive languages. Prior methods focus on increasing the model size and training data size. However, large models are difficult to optimize efficiently even with distributed parallel training and translation capacity can interfere among languages. 
To address the challenge, we propose LegoMT2, an efficient training approach with an asymmetric multi-way model architecture for massive multilingual neural machine translation. LegoMT2 shards 435 languages into 8 language-centric groups and attributes one local encoder for each group’s languages and a mix encoder-decoder for all languages. LegoMT2 trains the model through local data parallel and asynchronous distributed updating of parameters. LegoMT2 is 16.2\times faster than the distributed training method for M2M-100-12B (which only for 100 languages) while improving the translation performance by an average of 2.2 BLEU on Flores-101, especially performing better for low-resource languages . @@ -27104,7 +27104,7 @@ JinyuanXu XueHe Jenq-NengHwang - LeiLi + LeiLi 1736-1750 Understanding the decision-making processes of large language models (LLMs) is essential for their trustworthy development and deployment, however, current interpretability methods often face challenges such as low resolution and high computational cost. To address these limitations, we propose the Multi-Layer Attention Consistency Score (MACS), a novel, lightweight, and easily deployable heuristic for estimating the importance of input tokens in decoder-based models. MACS measures contributions of input tokens based on the consistency of maximal attention. Empirical evaluations demonstrate that MACS achieves a favorable trade-off between interpretability quality and computational efficiency, showing faithfulness comparable to complex techniques with a 22% decrease in VRAM usage and 30% reduction in latency. 2025.findings-emnlp.91 @@ -28380,7 +28380,7 @@ XinglinZhangMedical Image Insights TaoChenUniversity of Waterloo Jenq-NengHwang - LeiLi + LeiLi 3456-3467 Contrast-enhanced 3D Medical imaging (e.g., CT, MRI) leverages phase sequences to uncover temporal dynamics vital for diagnosing tumors, lesions, and vascular issues. However, current retrieval models primarily focus on spatial features, neglecting phase-specific progression detailed in clinical reports. We present the **Phase-aware Memory Network (PAMN)**, a novel framework enhancing 3D medical image retrieval by fusing imaging phases with diagnostic text. PAMN creates rich radiological representations that enhance diagnostic accuracy by combining image details with clinical report context, rigorously tested on a novel phase-series dataset of 12,230 hospital CT scans. PAMN achieves an effective balance of performance and scalability in 3D radiology retrieval, outperforming state-of-the-art baselines through the robust fusion of spatial, temporal, and textual information. 2025.findings-emnlp.184 @@ -38256,7 +38256,7 @@ WenhaoZhuByteDance Inc. 
HanxuHuMicrosoft Research ConghuiHeShanghai AI Lab - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University ShujianHuangNanjing University FeiYuan 16751-16774 @@ -43657,7 +43657,7 @@ <fixed-case>A</fixed-case>uto<fixed-case>MIR</fixed-case>: Effective Zero-Shot Medical Information Retrieval without Relevance Labels - LeiLi + LeiLi XiangxuZhangRenmin University of China XiaoZhou ZhengLiu diff --git a/data/xml/2025.iwslt.xml b/data/xml/2025.iwslt.xml index dafa1acfc8..1696407540 100644 --- a/data/xml/2025.iwslt.xml +++ b/data/xml/2025.iwslt.xml @@ -406,7 +406,7 @@ <fixed-case>CMU</fixed-case>’s <fixed-case>IWSLT</fixed-case> 2025 Simultaneous Speech Translation System SiqiOuyangCarnegie Mellon University XiXuCarnegie Mellon University - LeiLiCarnegie Mellon University + LeiLiCarnegie Mellon University 309-314 This paper presents CMU’s submission to the IWSLT 2025 Simultaneous Speech Translation (SST) task for translating unsegmented English speech into Chinese and German text in a streaming manner. Our end-to-end speech-to-text system integrates a chunkwise causal Wav2Vec 2.0 speech encoder, an adapter, and the Qwen2.5-7B-Instruct as the decoder. We use a two-stage simultaneous training procedure on robust speech segments synthesized from LibriSpeech, CommonVoice, and VoxPopuli datasets, utilizing standard cross-entropy loss. Our model supports adjustable latency through a configurable latency multiplier. Experimental results demonstrate that our system achieves 44.3 BLEU for English-to-Chinese and 25.1 BLEU for English-to-German translations on the ACL60/60 development set, with computation-aware latencies of 2.7 seconds and 2.3 seconds, and theoretical latencies of 2.2 and 1.7 seconds, respectively. 2025.iwslt-1.31 diff --git a/data/xml/2025.naacl.xml b/data/xml/2025.naacl.xml index b6e65a2d99..1a63346744 100644 --- a/data/xml/2025.naacl.xml +++ b/data/xml/2025.naacl.xml @@ -1282,7 +1282,7 @@ SiyuYuan KaiZhang YikaiZhang - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University YanghuaXiaoFudan University 1872-1888 Autonomous planning has been an ongoing pursuit since the inception of artificial intelligence. Based on curated problem solvers, early planning agents could deliver precise solutions for specific tasks but lacked generalization. The emergence of large language models (LLMs) and their powerful reasoning capabilities has reignited interest in autonomous planning by automatically generating reasonable solutions for given tasks. However, prior research and our experiments show that current language agents still lack human-level planning abilities. Even the state-of-the-art reasoning model, OpenAI o1, achieves only 15.6% on one of the complex real-world planning benchmarks. This highlights a critical question: What hinders language agents from achieving human-level planning? Although existing studies have highlighted weak performance in agent planning, the deeper underlying issues and the mechanisms and limitations of the strategies proposed to address them remain insufficiently understood. In this work, we apply the feature attribution study and identify two key factors that hinder agent planning: the limited role of constraints and the diminishing influence of questions. 
We also find that although current strategies help mitigate these challenges, they do not fully resolve them, indicating that agents still have a long way to go before reaching human-level intelligence. @@ -3938,7 +3938,7 @@ ZhehuaiChen VitalyLavrukhinNVIDIA JagadeeshBalamNVIDIA - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University BorisGinsburgNVIDIA 5547-5557 Simultaneous machine translation (SMT) takes streaming input utterances and incrementally produces target text. Existing SMT methods only use the partial utterance that has already arrived at the input and the generated hypothesis. Motivated by human interpreters’ technique to forecast future words before hearing them, we propose Translation by Anticipating Future (TAF), a method to improve translation quality while retaining low latency. Its core idea is to use a large language model (LLM) to predict future source words and opportunistically translate without introducing too much risk. We evaluate our TAF and multiple baselines of SMT on four language directions. Experiments show that TAF achieves the best translation quality-latency trade-off and outperforms the baselines by up to 5 BLEU points at the same latency (three words). @@ -4961,7 +4961,7 @@ <fixed-case>I</fixed-case>mg<fixed-case>T</fixed-case>rojan: Jailbreaking Vision-Language Models with <fixed-case>ONE</fixed-case> Image XijiaTao ShuaiZhong - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong QiLiuUniversity of Hong Kong LingpengKongDepartment of Computer Science, The University of Hong Kong 7048-7063 @@ -5567,7 +5567,7 @@ ShangZhou DanqingWangCMU, Carnegie Mellon University William YangWangUC Santa Barbara - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 7959-7973 Sampling is a basic operation for large language models (LLMs). In reinforcement learning rollouts and meta generation algorithms such as Best-of-N, it is essential to sample correct trajectories within a given compute budget. To find an optimal allocation for sample compute budgets, several choices need to be made:Which sampling configurations (model, temperature, language, etc.) to use?How many samples to generate in each configuration?We formulate these choices as a learning problem and propose OSCA, an algorithm that Optimizes Sample Compute Allocation by finding an optimal mix of different inference configurations.Our experiments show that with our learned mixed allocation, we can achieve accuracy better than the best single configuration with 128x less compute on code generation and 25x less compute on 4 reasoning tasks.is also shown to be effective in agentic workflows beyond single-turn tasks, achieving a better accuracy on SWE-Bench with 3x less compute than the default configuration.Our code and generations are released at https://github.com/LeiLiLab/OSCA. 2025.naacl-long.404 @@ -6287,7 +6287,7 @@ ChangMa ShuaiYuan QiushiSunUniversity of Hong Kong - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 9077-9090 The lottery ticket hypothesis posits the existence of “winning tickets” within a randomly initialized neural network. Do winning tickets exist for LLMs in fine-tuning scenarios? How can we find such winning tickets? In this paper, we propose KS-Lottery, a method to identify a small subset of LLM parameters highly effective in multilingual fine-tuning. 
Our key idea is to use Kolmogorov-Smirnov Test to analyze the distribution shift of parameters before and after fine-tuning. We further theoretically prove that KS-Lottery can find the certified winning tickets in the embedding layer, fine-tuning on the found parameters is guaranteed to perform as well as full fine-tuning. Comparing KS-Lottery with other tuning algorithms on translation tasks, the experimental results show that KS-Lottery finds a much smaller set of parameters for fine-tuning while achieving the comparable performance as full fine-tuning LLM. Surprisingly, we find that fine-tuning 18 tokens’ embedding of LLaMA suffices to reach the fine-tuning translation performance . 2025.naacl-long.458 diff --git a/data/xml/D18.xml b/data/xml/D18.xml index 8f6b6858aa..d995e57508 100644 --- a/data/xml/D18.xml +++ b/data/xml/D18.xml @@ -6212,7 +6212,7 @@ HaoyueShi HaoZhou JiazeChen - LeiLi + LeiLi 4631–4641 D18-1492 D18-1492.Attachment.zip diff --git a/data/xml/D19.xml b/data/xml/D19.xml index 5848dd445b..061437e9ca 100644 --- a/data/xml/D19.xml +++ b/data/xml/D19.xml @@ -953,7 +953,7 @@ ZhixingTan JinsongSu DeyiXiong - LeiLi + LeiLi 803–812 In this study, we first investigate a novel capsule network with dynamic routing for linear time Neural Machine Translation (NMT), referred as CapsNMT. CapsNMT uses an aggregation mechanism to map the source sentence into a matrix with pre-determined size, and then applys a deep LSTM network to decode the target sequence from the source representation. Unlike the previous work (CITATION) to store the source sentence with a passive and bottom-up way, the dynamic routing policy encodes the source sentence with an iterative process to decide the credit attribution between nodes from lower and higher layers. CapsNMT has two core properties: it runs in time that is linear in the length of the sequences and provides a more flexible way to aggregate the part-whole information of the source sentence. On WMT14 English-German task and a larger WMT14 English-French task, CapsNMT achieves comparable results with the Transformer system. To the best of our knowledge, this is the first work that capsule networks have been empirically investigated for sequence to sequence problems. D19-1074 @@ -4288,7 +4288,7 @@ FuliLuo ShunyaoLi PengchengYang - LeiLi + LeiLi BaobaoChang ZhifangSui XuSun @@ -8707,7 +8707,7 @@ The tutorial will bring researchers and practitioners to be aware of this issue, Discreteness in Neural Natural Language Processing LiliMou HaoZhou - LeiLi + LeiLi This tutorial provides a comprehensive guide to the process of discreteness in neural NLP. As a gentle start, we will briefly introduce the background of deep learning based NLP, where we point out the ubiquitous discreteness of natural language and its challenges in neural information processing. Particularly, we will focus on how such discreteness plays a role in the input space, the latent space, and the output space of a neural network. In each part, we will provide examples, discuss machine learning techniques, as well as demonstrate NLP applications. 
diff --git a/data/xml/K19.xml b/data/xml/K19.xml index bd138b9624..a909084b16 100644 --- a/data/xml/K19.xml +++ b/data/xml/K19.xml @@ -955,7 +955,7 @@ In Conclusion Not Repetition: Comprehensive Abstractive Summarization with Diversified Attention Based on Determinantal Point Processes - LeiLi + LeiLi WeiLiu MarinaLitvak NataliaVanetik diff --git a/data/xml/N18.xml b/data/xml/N18.xml index 9422c64272..1d475291bb 100644 --- a/data/xml/N18.xml +++ b/data/xml/N18.xml @@ -1409,7 +1409,7 @@ Reinforced Co-Training JiaweiWu - LeiLi + LeiLi William YangWang 1252–1262 Co-training is a popular semi-supervised learning framework to utilize a large amount of unlabeled data in addition to a small labeled set. Co-training methods exploit predicted labels on the unlabeled data and select samples based on prediction confidence to augment the training. However, the selection of samples in existing co-training methods is based on a predetermined policy, which ignores the sampling bias between the unlabeled and the labeled subsets, and fails to explore the data space. In this paper, we propose a novel method, Reinforced Co-Training, to select high-quality unlabeled samples to better co-train on. More specifically, our approach uses Q-learning to learn a data selection policy with a small labeled dataset, and then exploits this policy to train the co-training classifiers automatically. Experimental results on clickbait detection and generic text classification tasks demonstrate that our proposed method can obtain more accurate text classification results. diff --git a/data/xml/P16.xml b/data/xml/P16.xml index 5dcb56b7d4..4010ce6a2d 100644 --- a/data/xml/P16.xml +++ b/data/xml/P16.xml @@ -817,7 +817,7 @@ <fixed-case>CFO</fixed-case>: Conditional Focused Neural Question Answering with Large-scale Knowledge Bases ZihangDai - LeiLi + LeiLi WeiXu 800–810 P16-1076 diff --git a/data/xml/P19.xml b/data/xml/P19.xml index 0cdab3ee01..973cf97486 100644 --- a/data/xml/P19.xml +++ b/data/xml/P19.xml @@ -2488,7 +2488,7 @@ Enhancing Topic-to-Essay Generation with External Commonsense Knowledge PengchengYang - LeiLi + LeiLi FuliLuo TianyuLiu XuSun @@ -3286,7 +3286,7 @@ PengchengYang ZhihanZhang FuliLuo - LeiLi + LeiLi ChengyangHuang XuSun 2680–2686 @@ -7124,7 +7124,7 @@ HuangzhaoZhang HaoZhou NingMiao - LeiLi + LeiLi 5564–5569 Efficiently building an adversarial attacker for natural language processing (NLP) tasks is a real challenge. Firstly, as the sentence space is discrete, it is difficult to make small perturbations along the direction of gradients. Secondly, the fluency of the generated examples cannot be guaranteed. In this paper, we propose MHA, which addresses both problems by performing Metropolis-Hastings sampling, whose proposal is designed with the guidance of gradients. Experiments on IMDB and SNLI show that our proposed MHAoutperforms the baseline model on attacking capability. Adversarial training with MHA also leads to better robustness and performance. P19-1559 @@ -7669,7 +7669,7 @@ YuBao HaoZhou ShujianHuang - LeiLi + LeiLi LiliMou OlgaVechtomova Xin-yuDai @@ -7853,7 +7853,7 @@ YunxuanXiao YanruQu HaoZhou - LeiLi + LeiLi WeinanZhang YongYu 6140–6150 @@ -8732,7 +8732,7 @@ Automatic Generation of Personalized Comment Based on User Profile WenhuanZeng AbulikemuAbuduweili - LeiLi + LeiLi PengchengYang 229–235 Comments on social media are very diverse, in terms of content, style and vocabulary, which make generating comments much more challenging than other existing natural language generation (NLG) tasks. 
Besides, since different user has different expression habits, it is necessary to take the user’s profile into consideration when generating comments. In this paper, we introduce the task of automatic generation of personalized comment (AGPC) for social media. Based on tens of thousands of users’ real comments and corresponding user profiles on weibo, we propose Personalized Comment Generation Network (PCGN) for AGPC. The model utilizes user feature embedding with a gated memory and attends to user description to model personality of users. In addition, external user representation is taken into consideration during the decoding to enhance the comments generation. Experimental results show that our model can generate natural, human-like and personalized comments. diff --git a/data/xml/W13.xml b/data/xml/W13.xml index b3a11bbd51..351599ba29 100644 --- a/data/xml/W13.xml +++ b/data/xml/W13.xml @@ -5020,7 +5020,7 @@ Multi-document multilingual summarization corpus preparation, Part 1: <fixed-case>A</fixed-case>rabic, <fixed-case>E</fixed-case>nglish, <fixed-case>G</fixed-case>reek, <fixed-case>C</fixed-case>hinese, <fixed-case>R</fixed-case>omanian - LeiLi + LeiLi CorinaForascu MahmoudEl-Haj GeorgeGiannakopoulos @@ -5056,7 +5056,7 @@ <fixed-case>CIST</fixed-case> System Report for <fixed-case>ACL</fixed-case> <fixed-case>M</fixed-case>ulti<fixed-case>L</fixed-case>ing 2013 – Track 1: Multilingual Multi-document Summarization - LeiLi + LeiLi WeiHeng JiaYu YuLiu diff --git a/data/xml/W14.xml b/data/xml/W14.xml index 493fcd347b..9cdb41c81d 100644 --- a/data/xml/W14.xml +++ b/data/xml/W14.xml @@ -11786,7 +11786,7 @@ XiaoyueCong FangHuang HongfaXue - LeiLi + LeiLi ZhiqiaoGao 114–119 W14-6818 diff --git a/data/xml/W16.xml b/data/xml/W16.xml index 41fd606e0d..33d4e950d9 100644 --- a/data/xml/W16.xml +++ b/data/xml/W16.xml @@ -2289,7 +2289,7 @@ <fixed-case>CIST</fixed-case> System for <fixed-case>CL</fixed-case>-<fixed-case>S</fixed-case>ci<fixed-case>S</fixed-case>umm 2016 Shared Task - LeiLi + LeiLi LiyuanMao YazhaoZhang JunqiChi diff --git a/data/xml/W17.xml b/data/xml/W17.xml index 06300c5187..4e65bc6b2b 100644 --- a/data/xml/W17.xml +++ b/data/xml/W17.xml @@ -1679,7 +1679,7 @@ Word Embedding and Topic Modeling Enhanced Multiple Features for Content Linking and Argument / Sentiment Labeling in Online Forums - LeiLi + LeiLi LiyuanMao MoyeChen 32–36 @@ -4186,7 +4186,7 @@ is able to handle phenomena related to scope by means of an higher-order type th DanchenZhang DaqingHe SanqiangZhao - LeiLi + LeiLi 263–271 W17-2333 10.18653/v1/W17-2333 diff --git a/data/xml/W19.xml b/data/xml/W19.xml index 441404c593..51ef0d3e4e 100644 --- a/data/xml/W19.xml +++ b/data/xml/W19.xml @@ -17436,7 +17436,7 @@ In this tutorial on MT and post-editing we would like to continue sharing the la YaoFu HaoZhou JiazeChen - LeiLi + LeiLi 24–33 Text attribute transfer is modifying certain linguistic attributes (e.g. sentiment, style, author-ship, etc.) of a sentence and transforming them from one type to another. In this paper, we aim to analyze and interpret what is changed during the transfer process. We start from the observation that in many existing models and datasets, certain words within a sentence play important roles in determining the sentence attribute class. These words are referred as the Pivot Words. Based on these pivot words, we propose a lexical analysis framework, the Pivot Analysis, to quantitatively analyze the effects of these words in text attribute classification and transfer. 
We apply this framework to existing datasets and models and show that: (1) the pivot words are strong features for the classification of sentence attributes; (2) to change the attribute of a sentence, many datasets only requires to change certain pivot words; (3) consequently, many transfer models only perform the lexical-level modification,while leaving higher-level sentence structures unchanged. Our work provides an in-depth understanding of linguistic attribute transfer and further identifies the future requirements and challenges of this task W19-8604 @@ -18512,7 +18512,7 @@ In this tutorial on MT and post-editing we would like to continue sharing the la Multi-lingual <fixed-case>W</fixed-case>ikipedia Summarization and Title Generation On Low Resource Corpus WeiLiu - LeiLi + LeiLi ZuyingHuang YinanLiu 17–25 diff --git a/data/xml/Y06.xml b/data/xml/Y06.xml index 8d5cfaeb92..317f8c12a5 100644 --- a/data/xml/Y06.xml +++ b/data/xml/Y06.xml @@ -669,7 +669,7 @@ Research on <fixed-case>O</fixed-case>lympics-oriented Mobile Game News Ordering System YongguiYang - LeiLi + LeiLi 459–462 Y06-1069 http://hdl.handle.net/2065/29047 diff --git a/data/yaml/name_variants.yaml b/data/yaml/name_variants.yaml index 20ab849f87..07a967d937 100644 --- a/data/yaml/name_variants.yaml +++ b/data/yaml/name_variants.yaml @@ -5738,6 +5738,9 @@ - canonical: {first: Junhui, last: Li} variants: - {first: JunHui, last: Li} +- canonical: {first: Lei, last: Li} + id: lei-li + comment: May refer to several people - canonical: {first: Shih-Min, last: Li} variants: - {first: Shi-Min, last: Li} From b9db84b1b88c9aeb4129bc3f27f063ae7119f5f1 Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Thu, 6 Nov 2025 22:54:33 +0100 Subject: [PATCH 02/19] Add Lei Li (CMU) and edit id for all orcid-tagged papers - add Lei Li (Carnegie Mellon University) as a person including orcid (ending in `-9776`) and institution of degree - change id for all papers with this orcid away from the catch-all to the specific `lei-li-cmu` --- data/xml/2022.acl.xml | 8 ++++---- data/xml/2022.findings.xml | 8 ++++---- data/xml/2022.naacl.xml | 4 ++-- data/xml/2023.acl.xml | 8 ++++---- data/xml/2023.findings.xml | 2 +- data/xml/2024.emnlp.xml | 8 ++++---- data/xml/2024.findings.xml | 10 +++++----- data/xml/2025.acl.xml | 2 +- data/xml/2025.emnlp.xml | 2 +- data/xml/2025.findings.xml | 10 +++++----- data/xml/2025.naacl.xml | 8 ++++---- data/yaml/name_variants.yaml | 5 +++++ 12 files changed, 40 insertions(+), 35 deletions(-) diff --git a/data/xml/2022.acl.xml b/data/xml/2022.acl.xml index 4fab3c8f51..72e6ef489f 100644 --- a/data/xml/2022.acl.xml +++ b/data/xml/2022.acl.xml @@ -707,7 +707,7 @@ QianDong YaomingZhu MingxuanWang - LeiLi + LeiLi 680-694 How to find proper moments to generate partial sentence translation given a streaming speech input? Existing approaches waiting-and-translating for a fixed duration often break the acoustic units in speech, since the boundaries between acoustic units in speech are not even. In this paper, we propose MoSST, a simple yet effective method for translating streaming speech content. Given a usually long speech sequence, we develop an efficient monotonic segmentation module inside an encoder-decoder model to accumulate acoustic information incrementally and detect proper speech unit boundaries for the input in speech translation task. 
Experiments on multiple translation directions of the MuST-C dataset show that outperforms existing methods and achieves the best trade-off between translation quality (BLEU) and latency. Our code is available at https://github.com/dqqcasia/mosst. 2022.acl-long.50 @@ -2657,7 +2657,7 @@ WangchunshuZhou JingjingXu HaoZhou - LeiLi + LeiLi 2701-2714 Currently, masked language modeling (e.g., BERT) is the prime choice to learn contextualized representations. Due to the pervasiveness, it naturally raises an interesting question: how do masked language models (MLMs) learn contextual representations? In this work, we analyze the learning dynamics of MLMs and find that it adopts sampled embeddings as anchors to estimate and inject contextual semantics to representations, which limits the efficiency and effectiveness of MLMs. To address these problems, we propose TACO, a simple yet effective representation learning approach to directly model global semantics. To be specific, TACO extracts and aligns contextual semantics hidden in contextualized representations to encourage models to attend global semantics when generating contextualized representations. Experiments on the GLUE benchmark show that TACO achieves up to 5x speedup and up to 1.2 points average improvement over MLM. 2022.acl-long.193 @@ -6668,7 +6668,7 @@ in the Case of Unambiguous Gender <fixed-case>STEMM</fixed-case>: Self-learning with Speech-text Manifold Mixup for Speech Translation QingkaiFang RongYe - LeiLi + LeiLi YangFeng MingxuanWang 7050-7062 @@ -7867,7 +7867,7 @@ in the Case of Unambiguous Gender LihuaQian XinyuDai JiajunChen - LeiLi + LeiLi 8398-8409 Recently, parallel text generation has received widespread attention due to its success in generation efficiency. Although many advanced techniques are proposed to improve its generation quality, they still need the help of an autoregressive model for training to overcome the one-to-many multi-modal phenomenon in the dataset, limiting their applications. In this paper, we propose GLAT, which employs the discrete latent variables to capture word categorical information and invoke an advanced curriculum learning technique, alleviating the multi-modality problem. Experiment results show that our method outperforms strong baselines without the help of an autoregressive model, which further broadens the application scenarios of the parallel decoding paradigm. 2022.acl-long.575 diff --git a/data/xml/2022.findings.xml b/data/xml/2022.findings.xml index 8678f386d4..3cf3a0f0f9 100644 --- a/data/xml/2022.findings.xml +++ b/data/xml/2022.findings.xml @@ -880,7 +880,7 @@ XuandongZhao ZhiguoYu MingWu - LeiLi + LeiLi 774-781 How to learn highly compact yet effective sentence representation? Pre-trained language models have been effective in many NLP tasks. However, these models are often huge and produce large sentence embeddings. Moreover, there is a big performance gap between large and small models. In this paper, we propose Homomorphic Projective Distillation (HPD) to learn compressed sentence embeddings. Our method augments a small Transformer encoder model with learnable projection layers to produce compact representations while mimicking a large pre-trained language model to retain the sentence representation quality. We evaluate our method with different model sizes on both semantic textual similarity (STS) and semantic retrieval (SR) tasks. 
Experiments show that our method achieves 2.7-4.5 points performance gain on STS tasks compared with previous best representations of the same size. In SR tasks, our method improves retrieval speed (8.2×) and memory usage (8.0×) compared with state-of-the-art large models. Our implementation is available at https://github.com/XuandongZhao/HPD. 2022.findings-acl.64 @@ -3803,7 +3803,7 @@ ChengqiZhao ShujianHuang JiajunChen - LeiLi + LeiLi 3537-3548 This paper does not aim at introducing a novel model for document-level neural machine translation. Instead, we head back to the original Transformer model and hope to answer the following question: Is the capacity of current models strong enough for document-level translation? Interestingly, we observe that the original Transformer with appropriate training techniques can achieve strong results for document translation, even with a length of 2000 words. We evaluate this model and several recent approaches on nine document-level datasets and two sentence-level datasets across six languages. Experiments show that document-level Transformer models outperforms sentence-level ones and many previous methods in a comprehensive set of metrics, including BLEU, four lexical indices, three newly proposed assistant linguistic indicators, and human evaluation. 2022.findings-acl.279 @@ -4226,7 +4226,7 @@ ZhongqiaoLi XinboZhang ChangzhiSun - LeiLi + LeiLi YanghuaXiao HaoZhou 3941-3955 @@ -7198,7 +7198,7 @@ JingjingXu JiazeChen HaoZhou - LeiLi + LeiLi 2508-2527 We introduce MTG, a new benchmark suite for training and evaluating multilingual text generation. It is the first-proposed multilingual multiway text generation dataset with the largest human-annotated data (400k). It includes four generation tasks (story generation, question generation, title generation and text summarization) across five languages (English, German, French, Spanish and Chinese). The multiway setup enables testing knowledge transfer capabilities for a model across languages and tasks. Using MTG, we train and analyze several popular multilingual generation models from different aspects. Our benchmark suite fosters model performance enhancement with more human-annotated parallel data. It provides comprehensive evaluations with diverse generation scenarios. Code and data are available at https://github.com/zide05/MTG. 2022.findings-naacl.192 diff --git a/data/xml/2022.naacl.xml b/data/xml/2022.naacl.xml index 6c56c243dc..1be30a3583 100644 --- a/data/xml/2022.naacl.xml +++ b/data/xml/2022.naacl.xml @@ -973,7 +973,7 @@ Provably Confidential Language Modelling XuandongZhao - LeiLi + LeiLi Yu-XiangWang 943-955 Large language models are shown to memorize privacy information such as social security numbers in training data. Given the sheer scale of the training corpus, it is challenging to screen and filter these privacy data, either manually or automatically. In this paper, we propose Confidentially Redacted Training (CRT), a method to train language generation models while protecting the confidential segments. We borrow ideas from differential privacy (which solves a related but distinct problem) and show that our method is able to provably prevent unintended memorization by randomizing parts of the training process. Moreover, we show that redaction with an approximately correct screening policy amplifies the confidentiality guarantee. We implement the method for both LSTM and GPT language models. 
Our experimental results show that the models trained by CRT obtain almost the same perplexity while preserving strong confidentiality. @@ -5242,7 +5242,7 @@ Cross-modal Contrastive Learning for Speech Translation RongYe MingxuanWang - LeiLi + LeiLi 5099-5113 How can we learn unified representations for spoken utterances and their written text? Learning similar representations for semantically similar speech and text is important for speech translation. To this end, we propose ConST, a cross-modal contrastive learning method for end-to-end speech-to-text translation. We evaluate ConST and a variety of previous baselines on a popular benchmark MuST-C. Experiments show that the proposed ConST consistently outperforms the previous methods, and achieves an average BLEU of 29.4. The analysis further verifies that ConST indeed closes the representation gap of different modalities — its learned representation improves the accuracy of cross-modal speech-text retrieval from 4% to 88%. Code and models are available at https://github.com/ReneeYe/ConST. 2022.naacl-main.376 diff --git a/data/xml/2023.acl.xml b/data/xml/2023.acl.xml index e0dcf75007..22590a6adf 100644 --- a/data/xml/2023.acl.xml +++ b/data/xml/2023.acl.xml @@ -3036,7 +3036,7 @@ <fixed-case>WACO</fixed-case>: Word-Aligned Contrastive Learning for Speech Translation SiqiOuyangUniversity of California, Santa Barbara RongYeByteDance AI Lab - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara 3891-3907 End-to-end Speech Translation (E2E ST) aims to directly translate source speech into target text. Existing ST methods perform poorly when only extremely small speech-text data are available for training. We observe that an ST model’s performance closely correlates with its embedding similarity between speech and source transcript. In this paper, we propose Word-Aligned COntrastive learning (WACO), a simple and effective method for extremely low-resource speech-to-text translation. Our key idea is bridging word-level representations for both speech and text modalities via contrastive learning. We evaluate WACO and other methods on the MuST-C dataset, a widely used ST benchmark, and on a low-resource direction Maltese-English from IWSLT 2023. Our experiments demonstrate that WACO outperforms the best baseline by 9+ BLEU points with only 1-hour parallel ST data. Code is available at https://github.com/owaski/WACO. 2023.acl-long.216 @@ -4007,7 +4007,7 @@ WendaXuUniversity of California at Santa Barbara XianQianByteDance AI LAB MingxuanWangBytedance AI Lab - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara William YangWangUnversity of California, Santa Barbara 5166-5183 Is it possible to train a general metric for evaluating text generation quality without human-annotated ratings? Existing learned metrics either perform unsatisfactory across text generation tasks or require human ratings for training on specific tasks. In this paper, we propose SEScore2, a self-supervised approach for training a model-based metric for text generation evaluation. The key concept is to synthesize realistic model mistakes by perturbing sentences retrieved from a corpus. We evaluate SEScore2 and previous methods on four text generation tasks across three languages. SEScore2 outperforms all prior unsupervised metrics on four text generation evaluation benchmarks, with an average Kendall improvement of 0.158. 
Surprisingly, SEScore2 even outperforms the supervised BLEURT and COMET on multiple text generation tasks. @@ -7899,7 +7899,7 @@ WeiShiFudan University ZiquanFuSystem, Inc SijieChengFudan University - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara YanghuaXiaoFudan University 9890-9908 Large language models (LLMs) have been widely studied for their ability to store and utilize positive knowledge. However, negative knowledge, such as “lions don’t live in the ocean”, is also ubiquitous in the world but rarely mentioned explicitly in text. What do LLMs know about negative knowledge?This work examines the ability of LLMs on negative commonsense knowledge. We design a constrained keywords-to-sentence generation task (CG) and a Boolean question answering task (QA) to probe LLMs.Our experiments reveal that LLMs frequently fail to generate valid sentences grounded in negative commonsense knowledge, yet they can correctly answer polar yes-or-no questions. We term this phenomenon the belief conflict of LLMs.Our further analysis shows that statistical shortcuts and negation reporting bias from language modeling pre-training cause this conflict. @@ -12505,7 +12505,7 @@ SiqiOuyangUniversity of California, Santa Barbara ZhiguoYuMicrosoft MingWuGitHub, Inc. - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara 15590-15606 How can we extend a pre-trained model to many language understanding tasks, without labeled or additional unlabeled data? Pre-trained language models (PLMs) have been effective for a wide range of NLP tasks. However, existing approaches either require fine-tuning on downstream labeled datasets or manually constructing proper prompts. In this paper, we propose nonparametric prompting PLM (NPPrompt) for fully zero-shot language understanding. Unlike previous methods, NPPrompt uses only pre-trained language models and does not require any labeled data or additional raw corpus for further fine-tuning, nor does it rely on humans to construct a comprehensive set of prompt label words. We evaluate NPPrompt against previous major few-shot and zero-shot learning methods on diverse NLP tasks: including text classification, text entailment, similar text retrieval, paraphrasing, and multiple-choice question answering. Experimental results demonstrate that our NPPrompt outperforms the previous best fully zero-shot method by big margins, with absolute gains of 12.8% in accuracy on text classification and 15.6% on the GLUE benchmark. Our source code is available at https://anonymous.4open.science/r/NPPrompt. 
2023.acl-long.869 diff --git a/data/xml/2023.findings.xml b/data/xml/2023.findings.xml index b5af6bc1be..b67818d037 100644 --- a/data/xml/2023.findings.xml +++ b/data/xml/2023.findings.xml @@ -12344,7 +12344,7 @@ YinquanLuShanghai AI Laboratory WenhaoZhuNational Key Laboratory for Novel Software Technology, Nanjing University LingpengKongThe University of Hong Kong - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara YuQiaoShanghai AI Lab JingjingXuShanghai AI Lab 11518-11533 diff --git a/data/xml/2024.emnlp.xml b/data/xml/2024.emnlp.xml index b71bb6a0e9..955132db1c 100644 --- a/data/xml/2024.emnlp.xml +++ b/data/xml/2024.emnlp.xml @@ -912,7 +912,7 @@ ZhiyongWuShanghai Artificial Intelligence Laboratory BaobaoChangPeking University XuSun - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University ZhifangSuiPeking University 1107-1128 With the increasing capabilities of large language models (LLMs), in-context learning (ICL) has emerged as a new paradigm for natural language processing (NLP), where LLMs make predictions based on contexts augmented with a few examples. It has been a significant trend to explore ICL to evaluate and extrapolate the ability of LLMs. In this paper, we aim to survey and summarize the progress and challenges of ICL. We first present a formal definition of ICL and clarify its correlation to related studies. Then, we organize and discuss advanced techniques, including training strategies, prompt designing strategies, and related analysis. Additionally, we explore various ICL application scenarios, such as data engineering and knowledge updating. Finally, we address the challenges of ICL and suggest potential directions for further research. We hope that our work can encourage more research on uncovering how ICL works and improving ICL. @@ -8701,7 +8701,7 @@ WendaXu JiachenLiUniversity of California, Santa Barbara William YangWangUC Santa Barbara - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 11125-11139 Direct alignment from preferences (DAP) has emerged as a promising paradigm for aligning large language models (LLMs) to human desiderata from pre-collected, offline preference datasets. While recent studies indicate that existing offline DAP methods can directly benefit from online training samples, we highlight the need to develop specific online DAP algorithms to fully harness the power of online training. Specifically, we identify that the learned LLM should adhere to the proximity of the behavior LLM, which collects the training samples. To this end, we propose online Preference Optimization in proximity to the Behavior LLM (BPO), emphasizing the importance of constructing a proper trust region for LLM alignment.We conduct extensive experiments to validate the effectiveness and applicability of our approach by integrating it with various DAP methods, resulting in significant performance improvements across a wide range of tasks when training with the same amount of preference data. Even when only introducing one additional data collection phase, our online BPO improves its offline DAP baseline from 72.0% to 80.2% on TL;DR and from 82.2% to 89.1% on Anthropic Helpfulness in terms of win rate against human reference text. 
2024.emnlp-main.623 @@ -10250,7 +10250,7 @@ HanlinZhuElectrical Engineering & Computer Science Department, University of California Berkeley XiaomengYangGoogle DeepMind AndrewCohen - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University YuandongTianMeta AI (FAIR) 13274-13292 Recent research has increasingly focused on evaluating large language models’ (LLMs) alignment with diverse human values and preferences, particularly for open-ended tasks like story generation. Traditional evaluation metrics rely heavily on lexical similarity with human-written references, often showing poor correlation with human judgments and failing to account for alignment with the diversity of human preferences. To address these challenges, we introduce PerSE, an interpretable evaluation framework designed to assess alignment with specific human preferences. It is tuned to infer specific preferences from an in-context personal profile and evaluate the alignment between the generated content and personal preferences. PerSE enhances interpretability by providing detailed comments and fine-grained scoring, facilitating more personalized content generation. Our 13B LLaMA-2-based PerSE shows a 15.8% increase in Kendall correlation and a 13.7% rise in accuracy with zero-shot reviewers compared to GPT-4. It also outperforms GPT-4 by 46.01% in Kendall correlation on new domains, indicating its transferability @@ -18075,7 +18075,7 @@ WendaXu XiXu SiqiOuyangCMU, Carnegie Mellon University - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 344-350 With the rapid advancement of machine translation research, evaluation toolkits have become essential for benchmarking system progress. Tools like COMET and SacreBLEU offer single quality score assessments that are effective for pairwise system comparisons. However, these tools provide limited insights for fine-grained system-level comparisons and the analysis of instance-level defects. To address these limitations, we introduce Translation Canvas, an explainable interface designed to pinpoint and analyze translation systems’ performance: 1) Translation Canvas assists machine translation researchers in comprehending system-level model performance by identifying common errors (their frequency and severity) and analyzing relationships between different systems based on various evaluation metrics. 2) It supports fine-grained analysis by highlighting error spans with explanations and selectively displaying systems’ predictions. According to human evaluation, Translation Canvas demonstrates superior performance over COMET and SacreBLEU packages under enjoybility and understandbility criteria. 2024.emnlp-demo.36 diff --git a/data/xml/2024.findings.xml b/data/xml/2024.findings.xml index 52ad9d01e8..9fddf83d10 100644 --- a/data/xml/2024.findings.xml +++ b/data/xml/2024.findings.xml @@ -15929,7 +15929,7 @@ FeiYuan ShuaiYuan ZhiyongWuShanghai Artificial Intelligence Laboratory - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 12111-12130 Large Language Models (LLMs), often show strong performance on English tasks, while exhibiting limitations on other languages. What is an LLM’s multilingual capability when it is trained only on certain languages? The underlying mechanism remains unclear. 
This study endeavors to examine the multilingual capability of LLMs from the vocabulary sharing perspective by conducting an exhaustive analysis across 101 languages. Through the investigation of the performance gap before and after embedding fine-tuning, we discovered four distinct quadrants. By delving into each quadrant we provide actionable and efficient guidelines for tuning these languages. Extensive experiments reveal that existing LLMs possess multilingual capabilities that surpass our expectations, and we can significantly improve the multilingual performance of LLMs based on these attributes of each quadrant . 2024.findings-acl.721 @@ -18707,7 +18707,7 @@ ZhenqiaoSong TaiqiHe William YangWangUC Santa Barbara - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 15654-15669 How can large language models (LLMs) process and translate endangered languages? Many languages lack a large corpus to train a decent LLM; therefore existing LLMs rarely perform well in unseen, endangered languages. On the contrary, we observe that 2000 endangered languages, though without a large corpus, have a grammar book or a dictionary. We propose LingoLLM, a training-free approach to enable an LLM to process unseen languages that hardly occur in its pre-training. Our key insight is to demonstrate linguistic knowledge of an unseen language in an LLM’s prompt, including a dictionary, a grammar book, and morphologically analyzed input text. We implement LingoLLM on top of two models, GPT-4 and Mixtral, and evaluate their performance on 5 tasks across 8 endangered or low-resource languages. Our results show that LingoLLM elevates translation capability from GPT-4’s 0 to 10.5 BLEU for 10 language directions. Our findings demonstrate the tremendous value of linguistic knowledge in the age of LLMs for endangered languages. Our data, code, and model generations will be released to the public. Our data, code, and model generations can be found at https://github.com/LLiLab/llm4endangeredlang. 2024.findings-acl.925 @@ -19577,7 +19577,7 @@ BabakDamavandi Xin LunaDongFacebook ChristosFaloutsosAmazon and Carnegie Mellon University - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University SeungwhanMoonFacebook 247-266 Vision-extended LLMs have made significant strides in Visual Question Answering (VQA). Despite these advancements, VLLMs still encounter substantial difficulties in handling queries involving long-tail entities, with a tendency to produce erroneous or hallucinated responses. In this work, we introduce a novel evaluative benchmark named SnapNTell, specifically tailored for entity-centric VQA. This task aims to test the models’ capabilities in identifying entities and providing detailed, entity-specific knowledge. We have developed the SnapNTell Dataset, distinct from traditional VQA datasets: (1) It encompasses a wide range of categorized entities, each represented by images and explicitly named in the answers; (2) It features QA pairs that require extensive knowledge for accurate responses. The dataset is organized into 22 major categories, containing 7,568 unique entities in total. For each entity, we curated 10 illustrative images and crafted 10 knowledge-intensive QA pairs. To address this novel task, we devised a scalable, efficient, and transparent retrieval-augmented multimodal LLM. 
Our approach markedly outperforms existing methods on the SnapNTell dataset, achieving a 66.5% improvement in the BELURT score. @@ -24567,7 +24567,7 @@ and high variation in performance on the subset, suggesting our plausibility cri João DSMarquesInstituto Superior Técnico and INESC-ID MiguelGraça MiguelFreire - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University Arlindo L.Oliveira 6473-6486 Modern NLP tasks increasingly rely on dense retrieval methods to access up-to-date and relevant contextual information. We are motivated by the premise that retrieval benefits from segments that can vary in size such that a content’s semantic independence is better captured. We propose LumberChunker, a method leveraging an LLM to dynamically segment documents, which iteratively prompts the LLM to identify the point within a group of sequential passages where the content begins to shift. To evaluate our method, we introduce GutenQA, a benchmark with 3000 “needle in a haystack” type of question-answer pairs derived from 100 public domain narrative books available on Project Gutenberg. Our experiments show that LumberChunker not only outperforms the most competitive baseline by 7.37% in retrieval performance (DCG@20) but also that, when integrated into a RAG pipeline, LumberChunker proves to be more effective than other chunking methods and competitive baselines, such as the Gemini 1.5M Pro. @@ -28060,7 +28060,7 @@ and high variation in performance on the subset, suggesting our plausibility cri <fixed-case>LL</fixed-case>a<fixed-case>MAX</fixed-case>: Scaling Linguistic Horizons of <fixed-case>LLM</fixed-case> by Enhancing Translation Capabilities Beyond 100 Languages YinquanLuShanghai AI Laboratory WenhaoZhuNanjing University - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University YuQiao FeiYuan 10748-10772 diff --git a/data/xml/2025.acl.xml b/data/xml/2025.acl.xml index 785a06210b..0e9d3ba73e 100644 --- a/data/xml/2025.acl.xml +++ b/data/xml/2025.acl.xml @@ -4615,7 +4615,7 @@ XuandongZhaoUniversity of California, Berkeley ChenwenLiao Yu-XiangWangUniversity of California, San Diego - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 6304-6316 Text watermarks in large language models (LLMs) are increasingly used to detect synthetic text, mitigating misuse cases like fake news and academic dishonesty. While existing watermarking detection techniques primarily focus on classifying entire documents as watermarked or not, they often neglect the common scenario of identifying individual watermark segments within longer, mixed-source documents. Drawing inspiration from plagiarism detection systems, we propose two novel methods for partial watermark detection. First, we develop a geometry cover detection framework aimed at determining whether there is a watermark segment in long text. Second, we introduce an adaptive online learning algorithm to pinpoint the precise location of watermark segments within the text. Evaluated on three popular watermarking techniques (KGW-Watermark, Unigram-Watermark, and Gumbel-Watermark), our approach achieves high accuracy, significantly outperforming baseline methods. Moreover, our framework is adaptable to other watermarking techniques, offering new insights for precise watermark detection. 
Our code is publicly available at https://github.com/XuandongZhao/llm-watermark-location. 2025.acl-long.316 diff --git a/data/xml/2025.emnlp.xml b/data/xml/2025.emnlp.xml index d91a31816c..bf6c5000fe 100644 --- a/data/xml/2025.emnlp.xml +++ b/data/xml/2025.emnlp.xml @@ -25167,7 +25167,7 @@ AdamOfficerUniversity of Pittsburgh Medical Center AngelaChen YufeiHuangUniversity of Pittsburgh - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 480-486 Comprehensive pathway datasets are essential resources for advancing biological research, yet constructing these datasets is labor intensive. Recognizing the labor-intensive nature of constructing these critical resources, we present BioGraphia, a web-based annotation platform designed to facilitate collaborative pathway graph annotation. BioGraphia supports multi-user collaboration with real-time monitoring, curation, and interactive pathway graph visualization. It enables users to directly annotate the nodes and relations on the candidate graph, guided by detailed instructions. The platform is further enhanced with a large language model that automatically generates explainable and span-aligned pre-annotation to accelerate the annotation process. Its modular design allows flexible integration of external knowledge bases, and customization of the definition of annotation schema and, to support adaptation to other graph-based annotation tasks. Code is available at https://github.com/LeiLiLab/BioGraphia 2025.emnlp-demos.34 diff --git a/data/xml/2025.findings.xml b/data/xml/2025.findings.xml index 4538d945e4..7d74c6c282 100644 --- a/data/xml/2025.findings.xml +++ b/data/xml/2025.findings.xml @@ -3679,7 +3679,7 @@ A Practical Examination of <fixed-case>AI</fixed-case>-Generated Text Detectors for Large Language Models BrianTufts XuandongZhaoUniversity of California, Berkeley - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 4824-4841 The proliferation of large language models has raised growing concerns about their misuse, particularly in cases where AI-generated text is falsely attributed to human authors. Machine-generated content detectors claim to effectively identify such text under various conditions and from any language model. This paper critically evaluates these claims by assessing several popular detectors (RADAR, Wild, T5Sentinel, Fast-DetectGPT, PHD, LogRank, Binoculars) on a range of domains, datasets, and models that these detectors have not previously encountered. We employ various prompting strategies to simulate practical adversarial attacks, demonstrating that even moderate efforts can significantly evade detection. We emphasize the importance of the true positive rate at a specific false positive rate (TPR@FPR) metric and demonstrate that these detectors perform poorly in certain settings, with TPR@.01 as low as 0%. Our findings suggest that both trained and zero-shot detectors struggle to maintain high sensitivity while achieving a reasonable true positive rate. 2025.findings-naacl.271 @@ -5290,7 +5290,7 @@ XiXu WendaXu SiqiOuyangCMU, Carnegie Mellon University - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 7062-7067 Simultaneous speech translation (SimulST) systems must balance translation quality with response time, making latency measurement crucial for evaluating their real-world performance. 
However, there has been a longstanding belief that current metrics yield unrealistically high latency measurements in unsegmented streaming settings. In this paper, we investigate this phenomenon, revealing its root cause in a fundamental misconception underlying existing latency evaluation approaches. We demonstrate that this issue affects not only streaming but also segment-level latency evaluation across different metrics. Furthermore, we propose a modification to correctly measure computation-aware latency for SimulST systems, addressing the limitations present in existing metrics. 2025.findings-naacl.393 @@ -8591,7 +8591,7 @@ <fixed-case>I</fixed-case>nfini<fixed-case>SST</fixed-case>: Simultaneous Translation of Unbounded Speech with Large Language Model SiqiOuyangCMU, Carnegie Mellon University XiXu - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 3032-3046 Simultaneous translation of unbounded streaming speech remains a challenging problem due to the need for effectively processing the historical speech context and past translations so that quality and latency, including computation overhead, can be balanced. Most prior works assume pre-segmented speech, limiting their real-world applicability. In this paper, we propose InfiniSST, a novel approach that formulates SST as a multi-turn dialogue task, enabling seamless translation of unbounded speech. We construct translation trajectories and robust segments from MuST-C with multi-latency augmentation during training and develop a key-value (KV) cache management strategy to facilitate efficient inference. Experiments on MuST-C En-Es, En-De, and En-Zh demonstrate that InfiniSST reduces computation-aware latency by 0.5 to 1 second while maintaining the same translation quality compared to baselines. Ablation studies further validate the contributions of our data construction and cache management strategy. Code is released at https://github.com/LeiLiLab/InfiniSST. 2025.findings-acl.157 @@ -23213,7 +23213,7 @@ <fixed-case>L</fixed-case>ego<fixed-case>MT</fixed-case>2: Selective Asynchronous Sharded Data Parallel Training for Massive Neural Machine Translation FeiYuan YinquanLuShanghai AI Laboratory - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University JingjingXu 23359-23376 It is a critical challenge to learn a single model for massive languages. Prior methods focus on increasing the model size and training data size. However, large models are difficult to optimize efficiently even with distributed parallel training and translation capacity can interfere among languages. To address the challenge, we propose LegoMT2, an efficient training approach with an asymmetric multi-way model architecture for massive multilingual neural machine translation. LegoMT2 shards 435 languages into 8 language-centric groups and attributes one local encoder for each group’s languages and a mix encoder-decoder for all languages. LegoMT2 trains the model through local data parallel and asynchronous distributed updating of parameters. LegoMT2 is 16.2\times faster than the distributed training method for M2M-100-12B (which only for 100 languages) while improving the translation performance by an average of 2.2 BLEU on Flores-101, especially performing better for low-resource languages . @@ -38256,7 +38256,7 @@ WenhaoZhuByteDance Inc. 
HanxuHuMicrosoft Research ConghuiHeShanghai AI Lab - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University ShujianHuangNanjing University FeiYuan 16751-16774 diff --git a/data/xml/2025.naacl.xml b/data/xml/2025.naacl.xml index 1a63346744..793f627f0c 100644 --- a/data/xml/2025.naacl.xml +++ b/data/xml/2025.naacl.xml @@ -1282,7 +1282,7 @@ SiyuYuan KaiZhang YikaiZhang - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University YanghuaXiaoFudan University 1872-1888 Autonomous planning has been an ongoing pursuit since the inception of artificial intelligence. Based on curated problem solvers, early planning agents could deliver precise solutions for specific tasks but lacked generalization. The emergence of large language models (LLMs) and their powerful reasoning capabilities has reignited interest in autonomous planning by automatically generating reasonable solutions for given tasks. However, prior research and our experiments show that current language agents still lack human-level planning abilities. Even the state-of-the-art reasoning model, OpenAI o1, achieves only 15.6% on one of the complex real-world planning benchmarks. This highlights a critical question: What hinders language agents from achieving human-level planning? Although existing studies have highlighted weak performance in agent planning, the deeper underlying issues and the mechanisms and limitations of the strategies proposed to address them remain insufficiently understood. In this work, we apply the feature attribution study and identify two key factors that hinder agent planning: the limited role of constraints and the diminishing influence of questions. We also find that although current strategies help mitigate these challenges, they do not fully resolve them, indicating that agents still have a long way to go before reaching human-level intelligence. @@ -3938,7 +3938,7 @@ ZhehuaiChen VitalyLavrukhinNVIDIA JagadeeshBalamNVIDIA - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University BorisGinsburgNVIDIA 5547-5557 Simultaneous machine translation (SMT) takes streaming input utterances and incrementally produces target text. Existing SMT methods only use the partial utterance that has already arrived at the input and the generated hypothesis. Motivated by human interpreters’ technique to forecast future words before hearing them, we propose Translation by Anticipating Future (TAF), a method to improve translation quality while retaining low latency. Its core idea is to use a large language model (LLM) to predict future source words and opportunistically translate without introducing too much risk. We evaluate our TAF and multiple baselines of SMT on four language directions. Experiments show that TAF achieves the best translation quality-latency trade-off and outperforms the baselines by up to 5 BLEU points at the same latency (three words). @@ -5567,7 +5567,7 @@ ShangZhou DanqingWangCMU, Carnegie Mellon University William YangWangUC Santa Barbara - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 7959-7973 Sampling is a basic operation for large language models (LLMs). In reinforcement learning rollouts and meta generation algorithms such as Best-of-N, it is essential to sample correct trajectories within a given compute budget. 
To find an optimal allocation for sample compute budgets, several choices need to be made:Which sampling configurations (model, temperature, language, etc.) to use?How many samples to generate in each configuration?We formulate these choices as a learning problem and propose OSCA, an algorithm that Optimizes Sample Compute Allocation by finding an optimal mix of different inference configurations.Our experiments show that with our learned mixed allocation, we can achieve accuracy better than the best single configuration with 128x less compute on code generation and 25x less compute on 4 reasoning tasks.is also shown to be effective in agentic workflows beyond single-turn tasks, achieving a better accuracy on SWE-Bench with 3x less compute than the default configuration.Our code and generations are released at https://github.com/LeiLiLab/OSCA. 2025.naacl-long.404 @@ -6287,7 +6287,7 @@ ChangMa ShuaiYuan QiushiSunUniversity of Hong Kong - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 9077-9090 The lottery ticket hypothesis posits the existence of “winning tickets” within a randomly initialized neural network. Do winning tickets exist for LLMs in fine-tuning scenarios? How can we find such winning tickets? In this paper, we propose KS-Lottery, a method to identify a small subset of LLM parameters highly effective in multilingual fine-tuning. Our key idea is to use Kolmogorov-Smirnov Test to analyze the distribution shift of parameters before and after fine-tuning. We further theoretically prove that KS-Lottery can find the certified winning tickets in the embedding layer, fine-tuning on the found parameters is guaranteed to perform as well as full fine-tuning. Comparing KS-Lottery with other tuning algorithms on translation tasks, the experimental results show that KS-Lottery finds a much smaller set of parameters for fine-tuning while achieving the comparable performance as full fine-tuning LLM. Surprisingly, we find that fine-tuning 18 tokens’ embedding of LLaMA suffices to reach the fine-tuning translation performance . 
2025.naacl-long.458 diff --git a/data/yaml/name_variants.yaml b/data/yaml/name_variants.yaml index 07a967d937..1b604107b4 100644 --- a/data/yaml/name_variants.yaml +++ b/data/yaml/name_variants.yaml @@ -5741,6 +5741,11 @@ - canonical: {first: Lei, last: Li} id: lei-li comment: May refer to several people +- canonical: {first: Lei, last: Li} + id: lei-li-cmu + orcid: 0000-0003-3095-9776 + comment: Carnegie Mellon University + institution: Carnegie Mellon University - canonical: {first: Shih-Min, last: Li} variants: - {first: Shi-Min, last: Li} From 7afd769fdc5a2d490a0d6ea0cdddf24afa1b414a Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Thu, 6 Nov 2025 22:59:27 +0100 Subject: [PATCH 03/19] Add Lei Li (HKU) and edit id for all orcid-tagged papers - add Lei Li (University of Hong Kong) as a person including orcid (ending in `-5104`) and institution of degree - change id for all papers with this orcid away from the catch-all to the specific `lei-li-hku` --- data/xml/2024.emnlp.xml | 4 ++-- data/xml/2024.findings.xml | 4 ++-- data/xml/2025.acl.xml | 4 ++-- data/xml/2025.emnlp.xml | 4 ++-- data/xml/2025.naacl.xml | 2 +- data/yaml/name_variants.yaml | 5 +++++ 6 files changed, 14 insertions(+), 9 deletions(-) diff --git a/data/xml/2024.emnlp.xml b/data/xml/2024.emnlp.xml index 955132db1c..92ce3743bb 100644 --- a/data/xml/2024.emnlp.xml +++ b/data/xml/2024.emnlp.xml @@ -902,7 +902,7 @@ A Survey on In-context Learning QingxiuDong - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong DamaiDai CeZhengPeking University JingyuanMa @@ -5036,7 +5036,7 @@ <fixed-case>VLF</fixed-case>eedback: A Large-Scale <fixed-case>AI</fixed-case> Feedback Dataset for Large Vision-Language Models Alignment - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong ZhihuiXieShanghai Jiao Tong University MukaiLi ShunianChenShenzhen Research Institute of Big Data diff --git a/data/xml/2024.findings.xml b/data/xml/2024.findings.xml index 9fddf83d10..2b12bb3577 100644 --- a/data/xml/2024.findings.xml +++ b/data/xml/2024.findings.xml @@ -8815,7 +8815,7 @@ Red Teaming Visual Language Models MukaiLi - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong YuweiYin MasoodAhmed ZhenguangLiuZhejiang University @@ -13143,7 +13143,7 @@ YiLiuPeking University YuxiangWang ShuhuaiRen - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong SishuoChenAlibaba Group XuSun LuHouHuawei Technologies Ltd. 
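The commit messages of the previous two patches describe the follow-up step: once an ORCID ties a paper to one particular Lei Li, its author id is moved from the catch-all `lei-li` to the person-specific `lei-li-cmu` or `lei-li-hku`. That step reduces to rewriting the id attribute inside an explicitly curated set of papers. The sketch below is a hypothetical rendering of it, not the process actually used here: the `REASSIGN` mapping is seeded with two paper IDs visible in earlier hunks, the `url` child is assumed to hold the Anthology identifier, and `reassign_catch_all` is an invented name.

```python
# Hypothetical sketch -- not the workflow used to produce these patches.
# Moves the catch-all id="lei-li" to a person-specific id inside a curated
# set of papers, as described in the commit messages above.
from lxml import etree

# Example mapping; the two IDs below appear in earlier hunks, and any further
# entries would have to be curated by hand (e.g. from an ORCID works list).
REASSIGN = {
    "2025.acl-long.316": "lei-li-cmu",
    "2025.naacl-long.458": "lei-li-cmu",
}


def reassign_catch_all(xml_path: str, catch_all: str = "lei-li") -> int:
    """Swap the catch-all author id for the curated person-specific id."""
    tree = etree.parse(xml_path)
    changed = 0
    for paper in tree.getroot().iter("paper"):
        anth_id = (paper.findtext("url") or "").strip()  # e.g. "2025.acl-long.316"
        new_id = REASSIGN.get(anth_id)
        if new_id is None:
            continue
        for person in paper.iter():
            if person.tag in ("author", "editor") and person.get("id") == catch_all:
                person.set("id", new_id)
                changed += 1
    if changed:
        tree.write(xml_path, encoding="UTF-8", xml_declaration=True)
    return changed
```

Keying on the `url` text is only to keep the example self-contained; the essential point is that the paper list is curated by hand rather than inferred from the XML itself.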
diff --git a/data/xml/2025.acl.xml b/data/xml/2025.acl.xml index 0e9d3ba73e..f8b0c3ebc7 100644 --- a/data/xml/2025.acl.xml +++ b/data/xml/2025.acl.xml @@ -19239,7 +19239,7 @@ Benchmarking Long-Context Language Models on Long Code Understanding JiaLi XuyuanGuoPeking University - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong KechiZhangPeking University GeLiPeking University JiaLiTsinghua University @@ -23304,7 +23304,7 @@ Design Choices for Extending the Context Length of Visual Language Models MukaiLi - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong ShansanGong QiLiuUniversity of Hong Kong 33425-33438 diff --git a/data/xml/2025.emnlp.xml b/data/xml/2025.emnlp.xml index bf6c5000fe..6a1a3cc5ae 100644 --- a/data/xml/2025.emnlp.xml +++ b/data/xml/2025.emnlp.xml @@ -22082,7 +22082,7 @@ ShengWang JingweiDongthe University of Hong Kong KaiLiu - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong JiahuiGao JiyueJiang LingpengKongDepartment of Computer Science, The University of Hong Kong @@ -23892,7 +23892,7 @@ XiaonanLiFudan University MingZhongUniversity of Illinois Urbana Champaign ShansanGong - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong JunZhangByteDance JingjingXu LingpengKongDepartment of Computer Science, The University of Hong Kong diff --git a/data/xml/2025.naacl.xml b/data/xml/2025.naacl.xml index 793f627f0c..62936b7d90 100644 --- a/data/xml/2025.naacl.xml +++ b/data/xml/2025.naacl.xml @@ -4961,7 +4961,7 @@ <fixed-case>I</fixed-case>mg<fixed-case>T</fixed-case>rojan: Jailbreaking Vision-Language Models with <fixed-case>ONE</fixed-case> Image XijiaTao ShuaiZhong - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong QiLiuUniversity of Hong Kong LingpengKongDepartment of Computer Science, The University of Hong Kong 7048-7063 diff --git a/data/yaml/name_variants.yaml b/data/yaml/name_variants.yaml index 1b604107b4..c70af33eef 100644 --- a/data/yaml/name_variants.yaml +++ b/data/yaml/name_variants.yaml @@ -5746,6 +5746,11 @@ orcid: 0000-0003-3095-9776 comment: Carnegie Mellon University institution: Carnegie Mellon University +- canonical: {first: Lei, last: Li} + id: lei-li-hku + orcid: 0009-0008-6984-5104 + comment: University of Hong Kong + institution: University of Hong Kong - canonical: {first: Shih-Min, last: Li} variants: - {first: Shi-Min, last: Li} From 4535c91d2a71a0fc040f07b5b1e1d2beaeed8149 Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Fri, 7 Nov 2025 01:47:01 +0100 Subject: [PATCH 04/19] bsed on works in orcid.org add more entries to `lei-li-hku/cmu` though one case strange: 2024 emnlp of hku was listed on cmu orcid site --- data/xml/2020.acl.xml | 4 ++-- data/xml/2020.emnlp.xml | 6 +++--- data/xml/2020.findings.xml | 4 ++-- data/xml/2020.wmt.xml | 4 ++-- data/xml/2021.acl.xml | 14 +++++++------- data/xml/2021.eacl.xml | 2 +- data/xml/2021.emnlp.xml | 6 +++--- data/xml/2021.findings.xml | 12 ++++++------ data/xml/2021.iwslt.xml | 2 +- data/xml/2021.naacl.xml | 8 ++++---- data/xml/2021.wmt.xml | 2 +- data/xml/2022.findings.xml | 6 +++--- data/xml/2022.iwslt.xml | 2 +- data/xml/2023.emnlp.xml | 4 ++-- data/xml/2023.findings.xml | 4 ++-- data/xml/2024.acl.xml | 2 +- data/xml/2024.findings.xml | 4 ++-- data/xml/2024.iwslt.xml | 4 ++-- data/xml/2025.coling.xml | 2 +- data/xml/2025.iwslt.xml | 2 +- data/xml/D18.xml | 2 +- data/xml/D19.xml | 4 ++-- data/xml/N18.xml | 2 +- data/xml/P16.xml | 2 +- data/xml/P19.xml | 12 ++++++------ data/xml/W19.xml | 2 +- 26 files changed, 59 
insertions(+), 59 deletions(-) diff --git a/data/xml/2020.acl.xml b/data/xml/2020.acl.xml index 3918997eda..7b0399e1a1 100644 --- a/data/xml/2020.acl.xml +++ b/data/xml/2020.acl.xml @@ -4234,7 +4234,7 @@ NingMiao YuxuanSong HaoZhou - LeiLi + LeiLi 3436–3441 It has been a common approach to pre-train a language model on a large corpus and fine-tune it on task-specific data. In practice, we observe that fine-tuning a pre-trained model on a small dataset may lead to over- and/or under-estimate problem. In this paper, we propose MC-Tailor, a novel method to alleviate the above issue in text generation tasks by truncating and transferring the probability mass from over-estimated regions to under-estimated ones. Experiments on a variety of text generation datasets show that MC-Tailor consistently and significantly outperforms the fine-tuning approach. 2020.acl-main.314 @@ -10481,7 +10481,7 @@ XijinZhang SongchengJiang YuxuanWang - LeiLi + LeiLi 1–8 This paper proposes the building of Xiaomingbot, an intelligent, multilingual and multimodal software robot equipped with four inte- gral capabilities: news generation, news translation, news reading and avatar animation. Its system summarizes Chinese news that it automatically generates from data tables. Next, it translates the summary or the full article into multiple languages, and reads the multi- lingual rendition through synthesized speech. Notably, Xiaomingbot utilizes a voice cloning technology to synthesize the speech trained from a real person’s voice data in one input language. The proposed system enjoys several merits: it has an animated avatar, and is able to generate and read multilingual news. Since it was put into practice, Xiaomingbot has written over 600,000 articles, and gained over 150,000 followers on social media platforms. 2020.acl-demos.1 diff --git a/data/xml/2020.emnlp.xml b/data/xml/2020.emnlp.xml index 74ace32d5f..55e6af0b21 100644 --- a/data/xml/2020.emnlp.xml +++ b/data/xml/2020.emnlp.xml @@ -1707,7 +1707,7 @@ ShuangZeng RunxinXu BaobaoChang - LeiLi + LeiLi 1630–1640 Document-level relation extraction aims to extract relations among entities within a document. Different from sentence-level relation extraction, it requires reasoning over multiple sentences across paragraphs. In this paper, we propose Graph Aggregation-and-Inference Network (GAIN), a method to recognize such relations for long paragraphs. GAIN constructs two graphs, a heterogeneous mention-level graph (MG) and an entity-level graph (EG). The former captures complex interaction among different mentions and the latter aggregates mentions underlying for the same entities. Based on the graphs we propose a novel path reasoning mechanism to infer relations between entities. Experiments on the public dataset, DocRED, show GAIN achieves a significant performance improvement (2.85 on F1) over the previous state-of-the-art. Our code is available at https://github.com/PKUnlp-icler/GAIN. 2020.emnlp-main.127 @@ -2836,7 +2836,7 @@ XipengQiu JiangtaoFeng HaoZhou - LeiLi + LeiLi 2649–2663 We investigate the following question for machine translation (MT): can we develop a single universal MT model to serve as the common seed and obtain derivative and improved models on arbitrary language pairs? We propose mRASP, an approach to pre-train a universal multilingual neural machine translation model. 
Our key idea in mRASP is its novel technique of random aligned substitution, which brings words and phrases with similar meanings across multiple languages closer in the representation space. We pre-train a mRASP model on 32 language pairs jointly with only public datasets. The model is then fine-tuned on downstream language pairs to obtain specialized MT models. We carry out extensive experiments on 42 translation directions across a diverse settings, including low, medium, rich resource, and as well as transferring to exotic language pairs. Experimental results demonstrate that mRASP achieves significant performance improvement compared to directly training on those target pairs. It is the first time to verify that multiple lowresource language pairs can be utilized to improve rich resource MT. Surprisingly, mRASP is even able to improve the translation quality on exotic languages that never occur in the pretraining corpus. Code, data, and pre-trained models are available at https://github.com/linzehui/mRASP. 2020.emnlp-main.210 @@ -9842,7 +9842,7 @@ JunxianHe MingxuanWang YimingYang - LeiLi + LeiLi 9119–9130 Pre-trained contextual representations like BERT have achieved great success in natural language processing. However, the sentence embeddings from the pre-trained language models without fine-tuning have been found to poorly capture semantic meaning of sentences. In this paper, we argue that the semantic information in the BERT embeddings is not fully exploited. We first reveal the theoretical connection between the masked language model pre-training objective and the semantic similarity task theoretically, and then analyze the BERT sentence embeddings empirically. We find that BERT always induces a non-smooth anisotropic semantic space of sentences, which harms its performance of semantic similarity. To address this issue, we propose to transform the anisotropic sentence embedding distribution to a smooth and isotropic Gaussian distribution through normalizing flows that are learned with an unsupervised objective. Experimental results show that our proposed BERT-flow method obtains significant performance gains over the state-of-the-art sentence embeddings on a variety of semantic textual similarity tasks. The code is available at https://github.com/bohanli/BERT-flow. 2020.emnlp-main.733 diff --git a/data/xml/2020.findings.xml b/data/xml/2020.findings.xml index 28c4cdd206..63b5c7021e 100644 --- a/data/xml/2020.findings.xml +++ b/data/xml/2020.findings.xml @@ -1465,7 +1465,7 @@ Language Generation via Combinatorial Constraint Satisfaction: A Tree Search Enhanced <fixed-case>M</fixed-case>onte-<fixed-case>C</fixed-case>arlo Approach MaosenZhang NanJiang - LeiLi + LeiLi YexiangXue 1286–1298 Generating natural language under complex constraints is a principled formulation towards controllable text generation. We present a framework to allow specification of combinatorial constraints for sentence generation. We propose TSMC, an efficient method to generate high likelihood sentences with respect to a pre-trained language model while satisfying the constraints. Our approach is highly flexible, requires no task-specific train- ing, and leverages efficient constraint satisfaction solving techniques. To better handle the combinatorial constraints, a tree search algorithm is embedded into the proposal process of the Markov Chain Monte Carlo (MCMC) to explore candidates that satisfy more constraints. Compared to existing MCMC approaches, our sampling approach has a better mixing performance. 
Experiments show that TSMC achieves consistent and significant improvement on multiple language generation tasks. @@ -5726,7 +5726,7 @@ MingxuanWang WeinanZhang YongYu - LeiLi + LeiLi 4908–4917 Active learning for sentence understanding aims at discovering informative unlabeled data for annotation and therefore reducing the demand for labeled data. We argue that the typical uncertainty sampling method for active learning is time-consuming and can hardly work in real-time, which may lead to ineffective sample selection. We propose adversarial uncertainty sampling in discrete space (AUSDS) to retrieve informative unlabeled samples more efficiently. AUSDS maps sentences into latent space generated by the popular pre-trained language models, and discover informative unlabeled text samples for annotation via adversarial attack. The proposed approach is extremely efficient compared with traditional uncertainty sampling with more than 10x speedup. Experimental results on five datasets show that AUSDS outperforms strong baselines on effectiveness. 2020.findings-emnlp.441 diff --git a/data/xml/2020.wmt.xml b/data/xml/2020.wmt.xml index 56f716fc66..c516c6e1fe 100644 --- a/data/xml/2020.wmt.xml +++ b/data/xml/2020.wmt.xml @@ -471,7 +471,7 @@ ZehuiLin YaomingZhu MingxuanWang - LeiLi + LeiLi 305–312 This paper describes our submission systems for VolcTrans for WMT20 shared news translation task. We participated in 8 translation directions. Our basic systems are based on Transformer (CITATION), into which we also employed new architectures (bigger or deeper Transformers, dynamic convolution). The final systems include text pre-process, subword(a.k.a. BPE(CITATION)), baseline model training, iterative back-translation, model ensemble, knowledge distillation and multilingual pre-training. 2020.wmt-1.33 @@ -1443,7 +1443,7 @@ ZhuoZhi JunCao MingxuanWang - LeiLi + LeiLi 985–990 In this paper, we describe our submissions to the WMT20 shared task on parallel corpus filtering and alignment for low-resource conditions. The task requires the participants to align potential parallel sentence pairs out of the given document pairs, and score them so that low-quality pairs can be filtered. Our system, Volctrans, is made of two modules, i.e., a mining module and a scoring module. Based on the word alignment model, the mining mod- ule adopts an iterative mining strategy to extract latent parallel sentences. In the scoring module, an XLM-based scorer provides scores, followed by reranking mechanisms and ensemble. Our submissions outperform the baseline by 3.x/2.x and 2.x/2.x for km-en and ps-en on From Scratch/Fine-Tune conditions. 2020.wmt-1.112 diff --git a/data/xml/2021.acl.xml b/data/xml/2021.acl.xml index c2467d6434..a0b841b9de 100644 --- a/data/xml/2021.acl.xml +++ b/data/xml/2021.acl.xml @@ -284,7 +284,7 @@ ChangzhiSun YuanbinWu HaoZhou - LeiLi + LeiLi JunchiYan 220–231 Many joint entity relation extraction models setup two separated label spaces for the two sub-tasks (i.e., entity detection and relation classification). We argue that this setting may hinder the information interaction between entities and relations. In this work, we propose to eliminate the different treatment on the two sub-tasks’ label spaces. The input of our model is a table containing all word pairs from a sentence. Entities and relations are represented by squares and rectangles in the table. We apply a unified classifier to predict each cell’s label, which unifies the learning of two sub-tasks. 
For testing, an effective (yet fast) approximate decoder is proposed for finding squares and rectangles from tables. Experiments on three benchmarks (ACE04, ACE05, SciERC) show that, using only half the number of parameters, our model achieves competitive accuracy with the best extractor, and is faster. @@ -315,7 +315,7 @@ XiaoPan MingxuanWang LiweiWu - LeiLi + LeiLi 244–258 Existing multilingual machine translation approaches mainly focus on English-centric directions, while the non-English directions still lag behind. In this work, we aim to build a many-to-many translation system with an emphasis on the quality of non-English language directions. Our intuition is based on the hypothesis that a universal cross-language representation leads to better multilingual translation performance. To this end, we propose mRASP2, a training method to obtain a single unified multilingual translation model. mRASP2 is empowered by two techniques: a) a contrastive learning scheme to close the gap among representations of different languages, and b) data augmentation on both multiple parallel and monolingual data to further align token representations. For English-centric directions, mRASP2 achieves competitive or even better performance than a strong pre-trained model mBART on tens of WMT benchmarks. For non-English directions, mRASP2 achieves an improvement of average 10+ BLEU compared with the multilingual baseline 2021.acl-long.21 @@ -364,7 +364,7 @@ ZehuiLin LiweiWu MingxuanWang - LeiLi + LeiLi 293–305 Multilingual neural machine translation aims at learning a single translation model for multiple languages. These jointly trained models often suffer from performance degradationon rich-resource language pairs. We attribute this degeneration to parameter interference. In this paper, we propose LaSS to jointly train a single unified multilingual MT model. LaSS learns Language Specific Sub-network (LaSS) for each language pair to counter parameter interference. Comprehensive experiments on IWSLT and WMT datasets with various Transformer architectures show that LaSS obtains gains on 36 language pairs by up to 1.2 BLEU. Besides, LaSS shows its strong generalization performance at easy adaptation to new language pairs and zero-shot translation. LaSS boosts zero-shot translation with an average of 8.3 BLEU on 30 language pairs. Codes and trained models are available at https://github.com/NLP-Playground/LaSS. 2021.acl-long.25 @@ -2163,7 +2163,7 @@ LinQiu WeinanZhang YongYu - LeiLi + LeiLi 1993–2003 Recent work on non-autoregressive neural machine translation (NAT) aims at improving the efficiency by parallel decoding without sacrificing the quality. However, existing NAT methods are either inferior to Transformer or require multiple decoding passes, leading to reduced speedup. We propose the Glancing Language Model (GLM) for single-pass parallel generation models. With GLM, we develop Glancing Transformer (GLAT) for machine translation. With only single-pass parallel decoding, GLAT is able to generate high-quality translation with 8×-15× speedup. Note that GLAT does not modify the network architecture, which is a training method to learn word interdependency. Experiments on multiple WMT language directions show that GLAT outperforms all previous single pass non-autoregressive methods, and is nearly comparable to Transformer, reducing the gap to 0.25-0.9 BLEU points. 
2021.acl-long.155 @@ -3869,7 +3869,7 @@ The source code has been made available at \url{https://github.com/liam0949/DCLO Document-level Event Extraction via Heterogeneous Graph-based Interaction Model with a Tracker RunxinXu TianyuLiu - LeiLi + LeiLi BaobaoChang 3533–3546 Document-level event extraction aims to recognize event information from a whole piece of article. Existing methods are not effective due to two challenges of this task: a) the target event arguments are scattered across sentences; b) the correlation among events in a document is non-trivial to model. In this paper, we propose Heterogeneous Graph-based Interaction Model with a Tracker (GIT) to solve the aforementioned two challenges. For the first challenge, GIT constructs a heterogeneous graph interaction network to capture global interactions among different sentences and entity mentions. For the second, GIT introduces a Tracker module to track the extracted events and hence capture the interdependency among the events. Experiments on a large-scale dataset (Zheng et al, 2019) show GIT outperforms the previous methods by 2.8 F1. Further analysis reveals is effective in extracting multiple correlated events and event arguments that scatter across the document. @@ -7997,7 +7997,7 @@ The source code has been made available at \url{https://github.com/liam0949/DCLO HaoZhou ChunGan ZaixiangZheng - LeiLi + LeiLi 7361–7373 The choice of token vocabulary affects the performance of machine translation. This paper aims to figure out what is a good vocabulary and whether we can find the optimal vocabulary without trial training. To answer these questions, we first provide an alternative understanding of vocabulary from the perspective of information theory. It motivates us to formulate the quest of vocabularization – finding the best token dictionary with a proper size – as an optimal transport (OT) problem. We propose VOLT, a simple and efficient solution without trial training. Empirical results show that VOLT beats widely-used vocabularies in diverse scenarios, including WMT-14 English-German translation, TED bilingual translation, and TED multilingual translation. For example, VOLT achieves 70% vocabulary size reduction and 0.5 BLEU gain on English-German translation. Also, compared to BPE-search, VOLT reduces the search time from 384 GPU hours to 30 GPU hours on English-German translation. Codes are available at https://github.com/Jingjing-NLP/VOLT. 2021.acl-long.571 @@ -10453,7 +10453,7 @@ The source code has been made available at \url{https://github.com/liam0949/DCLO MingxuanWang QianqianDong RongYe - LeiLi + LeiLi 55–62 NeurST is an open-source toolkit for neural speech translation. The toolkit mainly focuses on end-to-end speech translation, which is easy to use, modify, and extend to advanced speech translation research and products. NeurST aims at facilitating the speech translation research for NLP researchers and building reliable benchmarks for this field. It provides step-by-step recipes for feature extraction, data preprocessing, distributed training, and evaluation. In this paper, we will introduce the framework design of NeurST and show experimental results for different benchmark datasets, which can be regarded as reliable baselines for future research. The toolkit is publicly available at https://github.com/bytedance/neurst and we will continuously update the performance of with other counterparts and studies at https://st-benchmark.github.io/. 
2021.acl-demo.7 diff --git a/data/xml/2021.eacl.xml b/data/xml/2021.eacl.xml index 5cc30f41bc..c6ad527d06 100644 --- a/data/xml/2021.eacl.xml +++ b/data/xml/2021.eacl.xml @@ -3008,7 +3008,7 @@ ChangzhiSun YuanbinWu HaoZhou - LeiLi + LeiLi JunchiYan 2877–2887 Current state-of-the-art systems for joint entity relation extraction (Luan et al., 2019; Wad-den et al., 2019) usually adopt the multi-task learning framework. However, annotations for these additional tasks such as coreference resolution and event extraction are always equally hard (or even harder) to obtain. In this work, we propose a pre-training method ENPAR to improve the joint extraction performance. ENPAR requires only the additional entity annotations that are much easier to collect. Unlike most existing works that only consider incorporating entity information into the sentence encoder, we further utilize the entity pair information. Specifically, we devise four novel objectives,i.e., masked entity typing, masked entity prediction, adversarial context discrimination, and permutation prediction, to pre-train an entity encoder and an entity pair encoder. Comprehensive experiments show that the proposed pre-training method achieves significant improvement over BERT on ACE05, SciERC, and NYT, and outperforms current state-of-the-art on ACE05. diff --git a/data/xml/2021.emnlp.xml b/data/xml/2021.emnlp.xml index c2f1fe5fb3..6068a3f571 100644 --- a/data/xml/2021.emnlp.xml +++ b/data/xml/2021.emnlp.xml @@ -1301,7 +1301,7 @@ HaoZhou WeinanZhang YongYu - LeiLi + LeiLi 1239–1250 Document-level relation extraction aims to identify relations between entities in a whole document. Prior efforts to capture long-range dependencies have relied heavily on implicitly powerful representations learned through (graph) neural networks, which makes the model less transparent. To tackle this challenge, in this paper, we propose LogiRE, a novel probabilistic model for document-level relation extraction by learning logic rules. LogiRE treats logic rules as latent variables and consists of two modules: a rule generator and a relation extractor. The rule generator is to generate logic rules potentially contributing to final predictions, and the relation extractor outputs final predictions based on the generated logic rules. Those two modules can be efficiently optimized with the expectation-maximization (EM) algorithm. By introducing logic rules into neural networks, LogiRE can explicitly capture long-range dependencies as well as enjoy better interpretation. Empirical results show that significantly outperforms several strong baselines in terms of relation performance and logical consistency. Our code is available at https://github.com/rudongyu/LogiRE. 2021.emnlp-main.95 @@ -4705,7 +4705,7 @@ ZhiyuanZeng JiazeChen WeiranXu - LeiLi + LeiLi 4102–4108 Neural abstractive summarization systems have gained significant progress in recent years. However, abstractive summarization often produce inconsisitent statements or false facts. How to automatically generate highly abstract yet factually correct summaries? In this paper, we proposed an efficient weak-supervised adversarial data augmentation approach to form the factual consistency dataset. Based on the artificial dataset, we train an evaluation model that can not only make accurate and robust factual consistency discrimination but is also capable of making interpretable factual errors tracing by backpropagated gradient distribution on token embeddings. 
Experiments and analysis conduct on public annotated summarization and factual consistency datasets demonstrate our approach effective and reasonable. 2021.emnlp-main.337 @@ -7934,7 +7934,7 @@ JunCao ShanboCheng ShujianHuang - LeiLi + LeiLi 7280–7290 How to effectively adapt neural machine translation (NMT) models according to emerging cases without retraining? Despite the great success of neural machine translation, updating the deployed models online remains a challenge. Existing non-parametric approaches that retrieve similar examples from a database to guide the translation process are promising but are prone to overfit the retrieved examples. However, non-parametric methods are prone to overfit the retrieved examples. In this work, we propose to learn Kernel-Smoothed Translation with Example Retrieval (KSTER), an effective approach to adapt neural machine translation models online. Experiments on domain adaptation and multi-domain machine translation datasets show that even without expensive retraining, KSTER is able to achieve improvement of 1.1 to 1.5 BLEU scores over the best existing online adaptation methods. The code and trained models are released at https://github.com/jiangqn/KSTER. 2021.emnlp-main.579 diff --git a/data/xml/2021.findings.xml b/data/xml/2021.findings.xml index 29c781856a..54401ea44f 100644 --- a/data/xml/2021.findings.xml +++ b/data/xml/2021.findings.xml @@ -2444,7 +2444,7 @@ ChiHan MingxuanWang HengJi - LeiLi + LeiLi 2214–2225 2021.findings-acl.195 10.18653/v1/2021.findings-acl.195 @@ -3026,7 +3026,7 @@ JiazeChen HaoZhou XipengQiu - LeiLi + LeiLi 2739–2750 2021.findings-acl.242 10.18653/v1/2021.findings-acl.242 @@ -3300,7 +3300,7 @@ LiweiWu ShanboCheng MingxuanWang - LeiLi + LeiLi 3001–3007 2021.findings-acl.264 10.18653/v1/2021.findings-acl.264 @@ -8770,7 +8770,7 @@ Multilingual Translation via Grafting Pre-trained Language Models ZeweiSun MingxuanWang - LeiLi + LeiLi 2735–2747 Can pre-trained BERT for one language and GPT for another be glued together to translate texts? Self-supervised training using only monolingual data has led to the success of pre-trained (masked) language models in many NLP tasks. However, directly connecting BERT as an encoder and GPT as a decoder can be challenging in machine translation, for GPT-like models lack a cross-attention component that is needed in seq2seq decoders. In this paper, we propose Graformer to graft separately pre-trained (masked) language models for machine translation. With monolingual data for pre-training and parallel data for grafting training, we maximally take advantage of the usage of both types of data. Experiments on 60 directions show that our method achieves average improvements of 5.8 BLEU in x2en and 2.9 BLEU in en2x directions comparing with the multilingual Transformer of the same size. 2021.findings-emnlp.233 @@ -8864,7 +8864,7 @@ JiangtaoFeng ChengqiZhao MingxuanWang - LeiLi + LeiLi 2812–2823 Developing a unified multilingual model has been a long pursuing goal for machine translation. However, existing approaches suffer from performance degradation - a single multilingual model is inferior to separately trained bilingual ones on rich-resource languages. We conjecture that such a phenomenon is due to interference brought by joint training with multiple languages. To accommodate the issue, we propose CIAT, an adapted Transformer model with a small parameter overhead for multilingual machine translation. We evaluate CIAT on multiple benchmark datasets, including IWSLT, OPUS-100, and WMT. 
Experiments show that the CIAT consistently outperforms strong multilingual baselines on 64 of total 66 language directions, 42 of which have above 0.5 BLEU improvement. 2021.findings-emnlp.240 @@ -10963,7 +10963,7 @@ TaoWang ChengqiZhao MingxuanWang - LeiLi + LeiLi HangLi DeyiXiong 4639–4644 diff --git a/data/xml/2021.iwslt.xml b/data/xml/2021.iwslt.xml index 6582fc3c5b..894656ce75 100644 --- a/data/xml/2021.iwslt.xml +++ b/data/xml/2021.iwslt.xml @@ -110,7 +110,7 @@ RongYe QianqianDong JunCao - LeiLi + LeiLi 64–74 This paper describes the systems submitted to IWSLT 2021 by the Volctrans team. We participate in the offline speech translation and text-to-text simultaneous translation tracks. For offline speech translation, our best end-to-end model achieves 7.9 BLEU improvements over the benchmark on the MuST-C test set and is even approaching the results of a strong cascade solution. For text-to-text simultaneous translation, we explore the best practice to optimize the wait-k model. As a result, our final submitted systems exceed the benchmark at around 7 BLEU on the same latency regime. We release our code and model to facilitate both future research works and industrial applications. 2021.iwslt-1.6 diff --git a/data/xml/2021.naacl.xml b/data/xml/2021.naacl.xml index d36faa17ca..08ce6ff0e0 100644 --- a/data/xml/2021.naacl.xml +++ b/data/xml/2021.naacl.xml @@ -6173,7 +6173,7 @@ Generative Imagination Elevates Machine Translation QuanyuLong MingxuanWang - LeiLi + LeiLi 5738–5748 There are common semantics shared across text and images. Given a sentence in a source language, whether depicting the visual scene helps translation into a target language? Existing multimodal neural machine translation methods (MNMT) require triplets of bilingual sentence - image for training and tuples of source sentence - image for inference. In this paper, we propose ImagiT, a novel machine translation method via visual imagination. ImagiT first learns to generate visual representation from the source sentence, and then utilizes both source sentence and the “imagined representation” to produce a target translation. Unlike previous methods, it only needs the source sentence at the inference time. Experiments demonstrate that ImagiT benefits from visual imagination and significantly outperforms the text-only neural machine translation baselines. Further analysis reveals that the imagination process in ImagiT helps fill in missing information when performing the degradation strategy. 2021.naacl-main.457 @@ -7335,7 +7335,7 @@ MingxuanWang HongxiaoBai HaiZhao - LeiLi + LeiLi 89–96 We propose to improve unsupervised neural machine translation with cross-lingual supervision (), which utilizes supervision signals from high resource language pairs to improve the translation of zero-source languages. Specifically, for training En-Ro system without parallel corpus, we can leverage the corpus from En-Fr and En-De to collectively train the translation from one language into many languages under one model. % is based on multilingual models which require no changes to the standard unsupervised NMT. Simple and effective, significantly improves the translation quality with a big margin in the benchmark unsupervised translation tasks, and even achieves comparable performance to supervised NMT. In particular, on WMT’14 -tasks achieves 37.6 and 35.18 BLEU score, which is very close to the large scale supervised setting and on WMT’16 -tasks achieves 35.09 BLEU score which is even better than the supervised Transformer baseline. 
2021.naacl-industry.12 @@ -7361,7 +7361,7 @@ TaoWang ChengqiZhao MingxuanWang - LeiLi + LeiLi DeyiXiong 105–112 Automatic translation of dialogue texts is a much needed demand in many real life scenarios. However, the currently existing neural machine translation delivers unsatisfying results. In this paper, we conduct a deep analysis of a dialogue corpus and summarize three major issues on dialogue translation, including pronoun dropping (), punctuation dropping (), and typos (). In response to these challenges, we propose a joint learning method to identify omission and typo, and utilize context to translate dialogue utterances. To properly evaluate the performance, we propose a manually annotated dataset with 1,931 Chinese-English parallel utterances from 300 dialogues as a benchmark testbed for dialogue translation. Our experiments show that the proposed method improves translation quality by 3.2 BLEU over the baselines. It also elevates the recovery rate of omitted pronouns from 26.09% to 47.16%. We will publish the code and dataset publicly at https://xxx.xx. @@ -7376,7 +7376,7 @@ YingXiong YangWei MingxuanWang - LeiLi + LeiLi 113–120 Transformer and its variants have achieved great success in natural language processing. Since Transformer models are huge in size, serving these models is a challenge for real industrial applications. In this paper, we propose , a highly efficient inference library for models in the Transformer family. includes a series of GPU optimization techniques to both streamline the computation of Transformer layers and reduce memory footprint. supports models trained using PyTorch and Tensorflow. Experimental results on standard machine translation benchmarks show that achieves up to 14x speedup compared with TensorFlow and 1.4x speedup compared with , a concurrent CUDA implementation. The code will be released publicly after the review. 2021.naacl-industry.15 diff --git a/data/xml/2021.wmt.xml b/data/xml/2021.wmt.xml index c9bed4b19a..7633cb4f0d 100644 --- a/data/xml/2021.wmt.xml +++ b/data/xml/2021.wmt.xml @@ -259,7 +259,7 @@ ZehuiLin JiangtaoFeng ShanboCheng - LeiLi + LeiLi MingxuanWang HaoZhou 187–196 diff --git a/data/xml/2022.findings.xml b/data/xml/2022.findings.xml index 3cf3a0f0f9..1d66490920 100644 --- a/data/xml/2022.findings.xml +++ b/data/xml/2022.findings.xml @@ -13046,7 +13046,7 @@ Faster and Smaller Speech Translation without Quality Compromise Distillation-Resistant Watermarking for Model Protection in <fixed-case>NLP</fixed-case> XuandongZhaoUC Santa Barbara - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara Yu-XiangWangUCSB 5044-5055 How can we protect the intellectual property of trained NLP models? Modern NLP models are prone to stealing by querying and distilling from their publicly exposed APIs. However, existing protection methods such as watermarking only work for images but are not applicable to text. We propose Distillation-Resistant Watermarking (DRW), a novel technique to protect NLP models from being stolen via distillation. DRW protects a model by injecting watermarks into the victim’s prediction probability corresponding to a secret key and is able to detect such a key by probing a suspect model. We prove that a protected model still retains the original accuracy within a certain bound. We evaluate DRW on a diverse set of NLP tasks including text classification, part-of-speech tagging, and named entity recognition. 
Experiments show that DRW protects the original model and detects stealing suspects at 100% mean average precision for all four tasks while the prior method fails on two. @@ -13946,7 +13946,7 @@ Faster and Smaller Speech Translation without Quality Compromise YifanSongPeking University JingjingXuShanghai AI Lab ZhifangSuiPeking University - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara 5937-5947 Previous literature has proved that Pretrained Language Models (PLMs) can store factual knowledge. However, we find that facts stored in the PLMs are not always correct. It motivates us to explore a fundamental question: How do we calibrate factual knowledge in PLMs without re-training from scratch? In this work, we propose a simple and lightweight method CaliNet to achieve this goal. To be specific, we first detect whether PLMs can learn the right facts via a contrastive score between right and fake facts. If not, we then use a lightweight method to add and adapt new parameters to specific factual texts. Experiments on the knowledge probing task show the calibration effectiveness and efficiency. In addition, through closed-book question answering, we find that the calibrated PLM possesses knowledge generalization ability after finetuning.Beyond the calibration performance, we further investigate and visualize the knowledge calibration mechanism. 2022.findings-emnlp.438 @@ -14613,7 +14613,7 @@ Faster and Smaller Speech Translation without Quality Compromise Yi-LinTuanUniversity of California, Santa Barbara YujieLuUniversity of California, Santa Barbara MichaelSaxonUniversity of California, Santa Barbara - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara William YangWangUnversity of California, Santa Barbara 6559-6574 Is it possible to build a general and automatic natural language generation (NLG) evaluation metric? Existing learned metrics either perform unsatisfactorily or are restricted to tasks where large human rating data is already available. We introduce SESCORE, a model-based metric that is highly correlated with human judgements without requiring human annotation, by utilizing a novel, iterative error synthesis and severity scoring pipeline. This pipeline applies a series of plausible errors to raw text and assigns severity labels by simulating human judgements with entailment. We evaluate SESCORE against existing metrics by comparing how their scores correlate with human ratings. SESCORE outperforms all prior unsupervised metrics on multiple diverse NLG tasks including machine translation, image captioning, and WebNLG text generation. For WMT 20/21En-De and Zh-En, SESCORE improve the average Kendall correlation with human judgement from 0.154 to 0.195. SESCORE even achieves comparable performance to the best supervised metric COMET, despite receiving no human annotated training data. diff --git a/data/xml/2022.iwslt.xml b/data/xml/2022.iwslt.xml index 3525f423fa..3a52524fee 100644 --- a/data/xml/2022.iwslt.xml +++ b/data/xml/2022.iwslt.xml @@ -112,7 +112,7 @@ On the Impact of Noises in Crowd-Sourced Data for Speech Translation SiqiOuyang RongYe - LeiLi + LeiLi 92-97 Training speech translation (ST) models requires large and high-quality datasets. MuST-C is one of the most widely used ST benchmark datasets. It contains around 400 hours of speech-transcript-translation data for each of the eight translation directions. This dataset passes several quality-control filters during creation. 
However, we find that MuST-C still suffers from three major quality issues: audiotext misalignment, inaccurate translation, and unnecessary speaker’s name. What are the impacts of these data quality issues for model development and evaluation? In this paper, we propose an automatic method to fix or filter the above quality issues, using English-German (En-De) translation as an example. Our experiments show that ST models perform better on clean test sets, and the rank of proposed models remains consistent across different test sets. Besides, simply removing misaligned data points from the training set does not lead to a better ST model. 2022.iwslt-1.9 diff --git a/data/xml/2023.emnlp.xml b/data/xml/2023.emnlp.xml index ee7dd7e37b..9c00b0fd08 100644 --- a/data/xml/2023.emnlp.xml +++ b/data/xml/2023.emnlp.xml @@ -5132,7 +5132,7 @@ ZhenqiaoSong MarkusFreitag WilliamWang - LeiLi + LeiLi 5967-5994 Automatically evaluating the quality of language generation is critical. Although recent learned metrics show high correlation with human judgement, these metrics do not provide explicit explanation of their verdict, nor associate the scores with defects in the generated text. To address this limitation, we present INSTRUCTSCORE, a fine-grained explainable evaluation metric for text generation. By harnessing both explicit human instruction and the implicit knowledge of GPT-4, we fine-tune a text evaluation metric based on LLaMA, producing both a score for generated text and a human readable diagnostic report. We evaluate INSTRUCTSCORE on a variety of generation tasks, including translation, captioning, data-to-text, and commonsense generation. Experiments show that our 7B model surpasses all other unsupervised metrics, including those based on 175B GPT-3 and GPT-4. Surprisingly, our INSTRUCTSCORE, even without direct supervision from human-rated data, achieves performance levels on par with state-of-the-art metrics like COMET22, which were fine-tuned on human ratings. 2023.emnlp-main.365 @@ -9223,7 +9223,7 @@ Learning from Mistakes via Cooperative Study Assistant for Large Language Models DanqingWang - LeiLi + LeiLi 10667-10685 Large language models (LLMs) have demonstrated their potential to refine their generation based on their own feedback. However, the feedback from LLM itself is often inaccurate, thereby limiting its benefits. In this paper, we propose Study Assistant for Large LAnguage Model (SALAM), a novel framework with an auxiliary agent to assist the main LLM in learning from mistakes through interactive cooperation. In the gathering phase, the student assistant agent probes the main LLM, analyzes its errors, and collects the interaction in a mistake memory. During the examination phase, the study assistant provides guidelines by retrieving relevant cases to help the main LLM anticipate and avoid similar errors. We first investigate the effectiveness of a general study assistant and then customize it to provide LLM-specific guidance through imitation learning from successful guidance experiences. Our experiments on three LLMs using two challenging frameworks demonstrate that SALAM can significantly boost LLMs by an accuracy margin of up to 6.6 on BBH and 12.6 on BBQ. 
2023.emnlp-main.659 diff --git a/data/xml/2023.findings.xml b/data/xml/2023.findings.xml index b67818d037..08375137ea 100644 --- a/data/xml/2023.findings.xml +++ b/data/xml/2023.findings.xml @@ -17331,7 +17331,7 @@ <fixed-case>A</fixed-case>uto<fixed-case>P</fixed-case>lan: Automatic Planning of Interactive Decision-Making Tasks With Large Language Models SiqiOuyang - LeiLi + LeiLi 3114-3128 Recent large language models (LLMs) are promising for making decisions in grounded environments. However, LLMs frequently fail in complex decision-making tasks due to the misalignment between the pre-trained knowledge in LLMs and the actual rules in the environment. Existing methods require either costly gradient computation or lengthy in-context demonstrations. In this paper, we propose AutoPlan, an approach to guide LLM-based agents to accomplish interactive decision-making tasks. AutoPlan augments the LLM prompt with a task-solving plan and optimizes it through iterative experience collection and reflection. Our experiments show that AutoPlan, though using no in-context demonstrations, achieves success rates on par with the baselines using human-written demonstrations on ALFWorld and even outperforms them by 8% on HotpotQA. The code is available at https://github.com/owaski/AutoPlan. 2023.findings-emnlp.205 @@ -28056,7 +28056,7 @@ BohongWu FeiYuan HaiZhao - LeiLi + LeiLi JingjingXu 15432-15444 Multilingual understanding models (or encoder-based), pre-trained via masked language modeling, have achieved promising results on many language understanding tasks (e.g., mBERT). However, these models are not capable of generating high-quality text compared with decoder-based causal language models. Can we transform a pre-trained language understanding model into an effective language generation model? We propose a Semantic-Guided Alignment-then-Denoising (SGA) approach to adapt a multilingual encoder to a multilingual generator with a small number of additional parameters. Experiments show that the proposed approach is an effective adaption method, outperforming widely-used initialization-based methods with gains of 9.4 BLEU on machine translation, 8.1 Rouge-L on question generation, and 5.5 METEOR on story generation on XLM-R_{large}. On the other hand, we observe that XLM-R is still inferior to mBART in supervised settings despite better results on zero-shot settings, indicating that more exploration is required to make understanding models strong generators. Our code is available at https://github.com/chengzhipanpan/XLMR4MT. diff --git a/data/xml/2024.acl.xml b/data/xml/2024.acl.xml index 0a00862971..68e647310f 100644 --- a/data/xml/2024.acl.xml +++ b/data/xml/2024.acl.xml @@ -11575,7 +11575,7 @@ GuangleiZhuCarnegie Mellon University XuandongZhaoUniversity of California, Berkeley LiangmingPanUniversity of California, Santa Barbara - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University WilliamWangUC Santa Barbara 15474-15492 Recent studies show that large language models (LLMs) improve their performance through self-feedback on certain tasks while degrade on others. We discovered that such a contrary is due to LLM’s bias in evaluating their own output. In this paper, we formally define LLM’s self-bias – the tendency to favor its own generation – using two statistics. We analyze six LLMs (GPT-4, GPT-3.5, Gemini, LLaMA2, Mixtral and DeepSeek) on translation, constrained text generation, and mathematical reasoning tasks. 
We find that self-bias is prevalent in all examined LLMs across multiple languages and tasks. Our analysis reveals that while the self-refine pipeline improves the fluency and understandability of model outputs, it further amplifies self-bias. To mitigate such biases, we discover that larger model size and external feedback with accurate assessment can significantly reduce bias in the self-refine pipeline, leading to actual performance improvement in downstream tasks. The code and data are released at https://github.com/xu1998hz/llm_self_bias. diff --git a/data/xml/2024.findings.xml b/data/xml/2024.findings.xml index 2b12bb3577..bd20b55e17 100644 --- a/data/xml/2024.findings.xml +++ b/data/xml/2024.findings.xml @@ -3228,7 +3228,7 @@ BiaoZhangGoogle DeepMind ZhongtaoLiuGoogle William YangWangUC Santa Barbara - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University MarkusFreitagGoogle 1429-1445 Recent large language models (LLM) areleveraging human feedback to improve theirgeneration quality. However, human feedbackis costly to obtain, especially during inference.In this work, we propose LLMRefine, aninference time optimization method to refineLLM’s output. The core idea is to usea learned fine-grained feedback model topinpoint defects and guide LLM to refinethem iteratively. Using original LLM as aproposal of edits, LLMRefine searches fordefect-less text via simulated annealing, tradingoff the exploration and exploitation. Weconduct experiments on three text generationtasks, including machine translation, long-form question answering (QA), and topicalsummarization. LLMRefine consistentlyoutperforms all baseline approaches, achievingimprovements up to 1.7 MetricX points ontranslation tasks, 8.1 ROUGE-L on ASQA, 2.2ROUGE-L on topical summarization. @@ -4399,7 +4399,7 @@ ShujianHuangNanjing University LingpengKongDepartment of Computer Science, The University of Hong Kong JiajunChenNanjing University - LeiLiSchool of Computer Science, Carnegie Mellon University + LeiLiSchool of Computer Science, Carnegie Mellon University 2765-2781 Large language models (LLMs) have demonstrated remarkable potential in handling multilingual machine translation (MMT). In this paper, we systematically investigate the advantages and challenges of LLMs for MMT by answering two questions: 1) How well do LLMs perform in translating massive languages? 2) Which factors affect LLMs’ performance in translation? We thoroughly evaluate eight popular LLMs, including ChatGPT and GPT-4. Our empirical results show that translation capabilities of LLMs are continually involving. GPT-4 has beat the strong supervised baseline NLLB in 40.91% of translation directions but still faces a large gap towards the commercial translation system like Google Translate, especially on low-resource languages. Through further analysis, we discover that LLMs exhibit new working patterns when used for MMT. First, LLM can acquire translation ability in a resource-efficient way and generate moderate translation even on zero-resource languages. Second, instruction semantics can surprisingly be ignored when given in-context exemplars. Third, cross-lingual exemplars can provide better task guidance for low-resource translation than exemplars in the same language pairs. Code will be released at: https://github.com/NJUNLP/MMT-LLM. 
2024.findings-naacl.176 diff --git a/data/xml/2024.iwslt.xml b/data/xml/2024.iwslt.xml index a824817398..fba61187d5 100644 --- a/data/xml/2024.iwslt.xml +++ b/data/xml/2024.iwslt.xml @@ -328,7 +328,7 @@ BrianYanCarnegie Mellon University PatrickFernandesCarnegie Mellon University WilliamChenCarnegie Mellon University - LeiLiCarnegie Mellon University + LeiLiCarnegie Mellon University GrahamNeubigCarnegie Mellon University ShinjiWatanabeCarnegie Mellon University 154-159 @@ -366,7 +366,7 @@ SiqiOuyangCarnegie Mellon University WilliamChenCarnegie Mellon University KarenLivescuTTI-Chicago - LeiLiCarnegie Mellon University + LeiLiCarnegie Mellon University GrahamNeubigCarnegie Mellon University ShinjiWatanabeCarnegie Mellon University 164-169 diff --git a/data/xml/2025.coling.xml b/data/xml/2025.coling.xml index a7ac61845a..cd3265a9a1 100644 --- a/data/xml/2025.coling.xml +++ b/data/xml/2025.coling.xml @@ -6219,7 +6219,7 @@ ZhaojiangLin YuningMao William YangWang - LeiLi + LeiLi Yi-ChiaWang 7819–7830 From ice cream flavors to climate change, people exhibit a wide array of opinions on various topics, and understanding the rationale for these opinions can promote healthy discussion and consensus among them. As such, it can be valuable for a large language model (LLM), particularly as an AI assistant, to be able to empathize with or even explain these various standpoints. In this work, we hypothesize that different topic stances often manifest correlations that can be used to extrapolate to topics with unknown opinions. We explore various prompting and fine-tuning methods to improve an LLM’s ability to (a) extrapolate from opinions on known topics to unknown ones and (b) support their extrapolation with reasoning. Our findings suggest that LLMs possess inherent knowledge from training data about these opinion correlations, and with minimal data, the similarities between human opinions and model-extrapolated opinions can be improved by more than 50%. Furthermore, LLM can generate the reasoning process behind their extrapolation of opinions. diff --git a/data/xml/2025.iwslt.xml b/data/xml/2025.iwslt.xml index 1696407540..fe3e308388 100644 --- a/data/xml/2025.iwslt.xml +++ b/data/xml/2025.iwslt.xml @@ -406,7 +406,7 @@ <fixed-case>CMU</fixed-case>’s <fixed-case>IWSLT</fixed-case> 2025 Simultaneous Speech Translation System SiqiOuyangCarnegie Mellon University XiXuCarnegie Mellon University - LeiLiCarnegie Mellon University + LeiLiCarnegie Mellon University 309-314 This paper presents CMU’s submission to the IWSLT 2025 Simultaneous Speech Translation (SST) task for translating unsegmented English speech into Chinese and German text in a streaming manner. Our end-to-end speech-to-text system integrates a chunkwise causal Wav2Vec 2.0 speech encoder, an adapter, and the Qwen2.5-7B-Instruct as the decoder. We use a two-stage simultaneous training procedure on robust speech segments synthesized from LibriSpeech, CommonVoice, and VoxPopuli datasets, utilizing standard cross-entropy loss. Our model supports adjustable latency through a configurable latency multiplier. Experimental results demonstrate that our system achieves 44.3 BLEU for English-to-Chinese and 25.1 BLEU for English-to-German translations on the ACL60/60 development set, with computation-aware latencies of 2.7 seconds and 2.3 seconds, and theoretical latencies of 2.2 and 1.7 seconds, respectively. 
2025.iwslt-1.31 diff --git a/data/xml/D18.xml b/data/xml/D18.xml index d995e57508..38e37e4496 100644 --- a/data/xml/D18.xml +++ b/data/xml/D18.xml @@ -6212,7 +6212,7 @@ HaoyueShi HaoZhou JiazeChen - LeiLi + LeiLi 4631–4641 D18-1492 D18-1492.Attachment.zip diff --git a/data/xml/D19.xml b/data/xml/D19.xml index 061437e9ca..75635449b7 100644 --- a/data/xml/D19.xml +++ b/data/xml/D19.xml @@ -953,7 +953,7 @@ ZhixingTan JinsongSu DeyiXiong - LeiLi + LeiLi 803–812 In this study, we first investigate a novel capsule network with dynamic routing for linear time Neural Machine Translation (NMT), referred as CapsNMT. CapsNMT uses an aggregation mechanism to map the source sentence into a matrix with pre-determined size, and then applys a deep LSTM network to decode the target sequence from the source representation. Unlike the previous work (CITATION) to store the source sentence with a passive and bottom-up way, the dynamic routing policy encodes the source sentence with an iterative process to decide the credit attribution between nodes from lower and higher layers. CapsNMT has two core properties: it runs in time that is linear in the length of the sequences and provides a more flexible way to aggregate the part-whole information of the source sentence. On WMT14 English-German task and a larger WMT14 English-French task, CapsNMT achieves comparable results with the Transformer system. To the best of our knowledge, this is the first work that capsule networks have been empirically investigated for sequence to sequence problems. D19-1074 @@ -4288,7 +4288,7 @@ FuliLuo ShunyaoLi PengchengYang - LeiLi + LeiLi BaobaoChang ZhifangSui XuSun diff --git a/data/xml/N18.xml b/data/xml/N18.xml index 1d475291bb..8471d0c101 100644 --- a/data/xml/N18.xml +++ b/data/xml/N18.xml @@ -1409,7 +1409,7 @@ Reinforced Co-Training JiaweiWu - LeiLi + LeiLi William YangWang 1252–1262 Co-training is a popular semi-supervised learning framework to utilize a large amount of unlabeled data in addition to a small labeled set. Co-training methods exploit predicted labels on the unlabeled data and select samples based on prediction confidence to augment the training. However, the selection of samples in existing co-training methods is based on a predetermined policy, which ignores the sampling bias between the unlabeled and the labeled subsets, and fails to explore the data space. In this paper, we propose a novel method, Reinforced Co-Training, to select high-quality unlabeled samples to better co-train on. More specifically, our approach uses Q-learning to learn a data selection policy with a small labeled dataset, and then exploits this policy to train the co-training classifiers automatically. Experimental results on clickbait detection and generic text classification tasks demonstrate that our proposed method can obtain more accurate text classification results. 
diff --git a/data/xml/P16.xml b/data/xml/P16.xml index 4010ce6a2d..03b1a5bcd3 100644 --- a/data/xml/P16.xml +++ b/data/xml/P16.xml @@ -817,7 +817,7 @@ <fixed-case>CFO</fixed-case>: Conditional Focused Neural Question Answering with Large-scale Knowledge Bases ZihangDai - LeiLi + LeiLi WeiXu 800–810 P16-1076 diff --git a/data/xml/P19.xml b/data/xml/P19.xml index 973cf97486..0e563d8546 100644 --- a/data/xml/P19.xml +++ b/data/xml/P19.xml @@ -2488,7 +2488,7 @@ Enhancing Topic-to-Essay Generation with External Commonsense Knowledge PengchengYang - LeiLi + LeiLi FuliLuo TianyuLiu XuSun @@ -3286,7 +3286,7 @@ PengchengYang ZhihanZhang FuliLuo - LeiLi + LeiLi ChengyangHuang XuSun 2680–2686 @@ -7124,7 +7124,7 @@ HuangzhaoZhang HaoZhou NingMiao - LeiLi + LeiLi 5564–5569 Efficiently building an adversarial attacker for natural language processing (NLP) tasks is a real challenge. Firstly, as the sentence space is discrete, it is difficult to make small perturbations along the direction of gradients. Secondly, the fluency of the generated examples cannot be guaranteed. In this paper, we propose MHA, which addresses both problems by performing Metropolis-Hastings sampling, whose proposal is designed with the guidance of gradients. Experiments on IMDB and SNLI show that our proposed MHAoutperforms the baseline model on attacking capability. Adversarial training with MHA also leads to better robustness and performance. P19-1559 @@ -7669,7 +7669,7 @@ YuBao HaoZhou ShujianHuang - LeiLi + LeiLi LiliMou OlgaVechtomova Xin-yuDai @@ -7853,7 +7853,7 @@ YunxuanXiao YanruQu HaoZhou - LeiLi + LeiLi WeinanZhang YongYu 6140–6150 @@ -8732,7 +8732,7 @@ Automatic Generation of Personalized Comment Based on User Profile WenhuanZeng AbulikemuAbuduweili - LeiLi + LeiLi PengchengYang 229–235 Comments on social media are very diverse, in terms of content, style and vocabulary, which make generating comments much more challenging than other existing natural language generation (NLG) tasks. Besides, since different user has different expression habits, it is necessary to take the user’s profile into consideration when generating comments. In this paper, we introduce the task of automatic generation of personalized comment (AGPC) for social media. Based on tens of thousands of users’ real comments and corresponding user profiles on weibo, we propose Personalized Comment Generation Network (PCGN) for AGPC. The model utilizes user feature embedding with a gated memory and attends to user description to model personality of users. In addition, external user representation is taken into consideration during the decoding to enhance the comments generation. Experimental results show that our model can generate natural, human-like and personalized comments. diff --git a/data/xml/W19.xml b/data/xml/W19.xml index 51ef0d3e4e..0df0123831 100644 --- a/data/xml/W19.xml +++ b/data/xml/W19.xml @@ -17436,7 +17436,7 @@ In this tutorial on MT and post-editing we would like to continue sharing the la YaoFu HaoZhou JiazeChen - LeiLi + LeiLi 24–33 Text attribute transfer is modifying certain linguistic attributes (e.g. sentiment, style, author-ship, etc.) of a sentence and transforming them from one type to another. In this paper, we aim to analyze and interpret what is changed during the transfer process. We start from the observation that in many existing models and datasets, certain words within a sentence play important roles in determining the sentence attribute class. These words are referred as the Pivot Words. 
Based on these pivot words, we propose a lexical analysis framework, the Pivot Analysis, to quantitatively analyze the effects of these words in text attribute classification and transfer. We apply this framework to existing datasets and models and show that: (1) the pivot words are strong features for the classification of sentence attributes; (2) to change the attribute of a sentence, many datasets only requires to change certain pivot words; (3) consequently, many transfer models only perform the lexical-level modification,while leaving higher-level sentence structures unchanged. Our work provides an in-depth understanding of linguistic attribute transfer and further identifies the future requirements and challenges of this task W19-8604 From e3c16980e79f9afee4fe3cd2fc40277ca9e83d11 Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Fri, 7 Nov 2025 01:57:26 +0100 Subject: [PATCH 05/19] add more entries to `lei-li-hku` based on personal cv/website `cv-LILEI-2501.pdf` --- data/xml/2021.emnlp.xml | 2 +- data/xml/2021.findings.xml | 2 +- data/xml/2022.findings.xml | 2 +- data/xml/2023.emnlp.xml | 4 ++-- data/xml/2024.acl.xml | 4 ++-- 5 files changed, 7 insertions(+), 7 deletions(-) diff --git a/data/xml/2021.emnlp.xml b/data/xml/2021.emnlp.xml index 6068a3f571..587d87fdda 100644 --- a/data/xml/2021.emnlp.xml +++ b/data/xml/2021.emnlp.xml @@ -432,7 +432,7 @@ Dynamic Knowledge Distillation for Pre-trained Language Models - LeiLi + LeiLi YankaiLin ShuhuaiRen PengLi diff --git a/data/xml/2021.findings.xml b/data/xml/2021.findings.xml index 54401ea44f..d1de8d38bb 100644 --- a/data/xml/2021.findings.xml +++ b/data/xml/2021.findings.xml @@ -6240,7 +6240,7 @@ <fixed-case>C</fixed-case>ascade<fixed-case>BERT</fixed-case>: Accelerating Inference of Pre-trained Language Models via Calibrated Complete Models Cascade - LeiLi + LeiLi YankaiLin DeliChen ShuhuaiRen diff --git a/data/xml/2022.findings.xml b/data/xml/2022.findings.xml index 1d66490920..94322d177d 100644 --- a/data/xml/2022.findings.xml +++ b/data/xml/2022.findings.xml @@ -14453,7 +14453,7 @@ Faster and Smaller Speech Translation without Quality Compromise From Mimicking to Integrating: Knowledge Integration for Pre-Trained Language Models - LeiLiPeking University + LeiLiPeking University YankaiLinGaoling School of Artificial Intelligence, Renmin University of China XuanchengRenPeking University GuangxiangZhaoPeking University diff --git a/data/xml/2023.emnlp.xml b/data/xml/2023.emnlp.xml index 9c00b0fd08..1455cdd5b6 100644 --- a/data/xml/2023.emnlp.xml +++ b/data/xml/2023.emnlp.xml @@ -8511,7 +8511,7 @@ Label Words are Anchors: An Information Flow Perspective for Understanding In-Context Learning LeanWang - LeiLi + LeiLi DamaiDai DeliChen HaoZhou @@ -10152,7 +10152,7 @@ Can Language Models Understand Physical Concepts? 
- LeiLi + LeiLi JingjingXu QingxiuDong CeZheng diff --git a/data/xml/2024.acl.xml b/data/xml/2024.acl.xml index 68e647310f..3f1bd5a505 100644 --- a/data/xml/2024.acl.xml +++ b/data/xml/2024.acl.xml @@ -7096,7 +7096,7 @@ Large Language Models are not Fair Evaluators PeiyiWang - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong LiangChen ZefanCai DaweiZhu @@ -10832,7 +10832,7 @@ Multimodal <fixed-case>A</fixed-case>r<fixed-case>X</fixed-case>iv: A Dataset for Improving Scientific Comprehension of Large Vision-Language Models - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong YuqiWangUniversity of Hong Kong RunxinXuPeking University PeiyiWangPeking University From e74e1c255ece5adf6d7d6e0c4585aa4b3ce4e34b Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Fri, 7 Nov 2025 02:28:25 +0100 Subject: [PATCH 06/19] add more entries to `lei-li-hku/cmu` - based on cmu personal website of publications - hku google scholar --- data/xml/2021.findings.xml | 2 +- data/xml/2023.americasnlp.xml | 2 +- data/xml/2024.acl.xml | 4 ++-- data/xml/2024.naacl.xml | 2 +- 4 files changed, 5 insertions(+), 5 deletions(-) diff --git a/data/xml/2021.findings.xml b/data/xml/2021.findings.xml index d1de8d38bb..f8b3ca72d9 100644 --- a/data/xml/2021.findings.xml +++ b/data/xml/2021.findings.xml @@ -3464,7 +3464,7 @@ YuanbinWu JiazeChen HaoZhou - LeiLi + LeiLi 3140–3151 2021.findings-acl.277 10.18653/v1/2021.findings-acl.277 diff --git a/data/xml/2023.americasnlp.xml b/data/xml/2023.americasnlp.xml index 5f13fb31f4..77e2132a93 100644 --- a/data/xml/2023.americasnlp.xml +++ b/data/xml/2023.americasnlp.xml @@ -230,7 +230,7 @@ TianruiGuUniversity of California, Santa Barbara KaieChenUniversity of California, Santa Barbara SiqiOuyangUniversity of California, Santa Barbara - LeiLiUniversity of California Santa Barbara + LeiLiUniversity of California Santa Barbara 173-176 This paper presents PlayGround’s submission to the AmericasNLP 2023 shared task on machine translation (MT) into indigenous languages. We finetuned NLLB-600M, a multilingual MT model pre-trained on Flores-200, on 10 low-resource language directions and examined the effectiveness of weight averaging and back translation. Our experiments showed that weight averaging, on average, led to a 0.0169 improvement in the ChrF++ score. Additionally, we found that back translation resulted in a 0.008 improvement in the ChrF++ score. 2023.americasnlp-1.19 diff --git a/data/xml/2024.acl.xml b/data/xml/2024.acl.xml index 3f1bd5a505..66a5ff717f 100644 --- a/data/xml/2024.acl.xml +++ b/data/xml/2024.acl.xml @@ -7079,7 +7079,7 @@ Math-Shepherd: Verify and Reinforce <fixed-case>LLM</fixed-case>s Step-by-step without Human Annotations PeiyiWang - LeiLiUniversity of Hong Kong + LeiLiUniversity of Hong Kong ZhihongShaoTsinghua University, Tsinghua University RunxinXu DamaiDai @@ -14422,7 +14422,7 @@ Watermarking for Large Language Models XuandongZhao Yu-XiangWang - LeiLi + LeiLi 10-11 As AI-generated text increasingly resembles human-written content, the ability to detect machine-generated text becomes crucial in both the computational linguistics and machine learning communities. In this tutorial, we aim to provide an in-depth exploration of text watermarking, a subfield of linguistic steganography with the goal of embedding a hidden message (the watermark) within a text passage. 
We will introduce the fundamentals of text watermarking, discuss the main challenges in identifying AI-generated text, and delve into the current watermarking methods, assessing their strengths and weaknesses. Moreover, we will explore other possible applications of text watermarking and discuss future directions for this field. Each section will be supplemented with examples and key takeaways. 2024.acl-tutorials.6 diff --git a/data/xml/2024.naacl.xml b/data/xml/2024.naacl.xml index 134e936cfb..c291b40970 100644 --- a/data/xml/2024.naacl.xml +++ b/data/xml/2024.naacl.xml @@ -8700,7 +8700,7 @@ MuhaoChenUC Davis ChaoweiXiaoUW-Madison HuanSunOSU - LeiLiCMU + LeiLiCMU LeonDerczynskiUW Seattle AnimaAnandkumarCaltech, NVIDIA FeiWangUSC From a17357d78de3573a4e844c7634510023719733f1 Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Fri, 7 Nov 2025 02:50:30 +0100 Subject: [PATCH 07/19] introducing `lei-li-bupt` --- data/yaml/name_variants.yaml | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/data/yaml/name_variants.yaml b/data/yaml/name_variants.yaml index c70af33eef..7ac2003d36 100644 --- a/data/yaml/name_variants.yaml +++ b/data/yaml/name_variants.yaml @@ -5751,6 +5751,11 @@ orcid: 0009-0008-6984-5104 comment: University of Hong Kong institution: University of Hong Kong +- canonical: {first: Lei, last: Li} + id: lei-li-bupt + orcid: 0000-0002-3204-6527 + comment: Beijing University of Posts and Telecommunications + institution: Beijing University of Posts and Telecommunications - canonical: {first: Shih-Min, last: Li} variants: - {first: Shi-Min, last: Li} From 39f974fe848346edcfe2a11781a5502a166a4857 Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Fri, 7 Nov 2025 02:51:50 +0100 Subject: [PATCH 08/19] add papers to `lei-li-bupt` based on openreview/affiliation --- data/xml/2020.sdp.xml | 2 +- data/xml/2021.findings.xml | 2 +- data/xml/2022.aacl.xml | 2 +- data/xml/2022.findings.xml | 2 +- data/xml/2024.lrec.xml | 2 +- data/xml/K19.xml | 2 +- data/xml/W13.xml | 2 +- data/xml/W16.xml | 2 +- 8 files changed, 8 insertions(+), 8 deletions(-) diff --git a/data/xml/2020.sdp.xml b/data/xml/2020.sdp.xml index 5d198dd20d..2e3e41d958 100644 --- a/data/xml/2020.sdp.xml +++ b/data/xml/2020.sdp.xml @@ -349,7 +349,7 @@ <fixed-case>CIST</fixed-case>@<fixed-case>CL</fixed-case>-<fixed-case>S</fixed-case>ci<fixed-case>S</fixed-case>umm 2020, <fixed-case>L</fixed-case>ong<fixed-case>S</fixed-case>umm 2020: Automatic Scientific Document Summarization - LeiLi + LeiLi YangXie WeiLiu YinanLiu diff --git a/data/xml/2021.findings.xml b/data/xml/2021.findings.xml index f8b3ca72d9..6dc9353b6c 100644 --- a/data/xml/2021.findings.xml +++ b/data/xml/2021.findings.xml @@ -925,7 +925,7 @@ <fixed-case>U</fixed-case>ni<fixed-case>K</fixed-case>eyphrase: A Unified Extraction and Generation Framework for Keyphrase Prediction HuanqinWu WeiLiu - LeiLi + LeiLi DanNie TaoChen FengZhang diff --git a/data/xml/2022.aacl.xml b/data/xml/2022.aacl.xml index 19f589335b..367920f172 100644 --- a/data/xml/2022.aacl.xml +++ b/data/xml/2022.aacl.xml @@ -553,7 +553,7 @@ <fixed-case>SAPG</fixed-case>raph: Structure-aware Extractive Summarization for Scientific Papers with Heterogeneous Graph SiyaQi - LeiLi + LeiLi YiyangLi JinJiang DingxinHu diff --git a/data/xml/2022.findings.xml b/data/xml/2022.findings.xml index 94322d177d..25af1088c6 100644 --- a/data/xml/2022.findings.xml +++ b/data/xml/2022.findings.xml @@ -11942,7 +11942,7 @@ Faster and Smaller Speech 
Translation without Quality Compromise SiyiWangBeijing University of Posts and Telecommunications KaiWangBeijing University of Posts and Telecommunications YanquanZhouBeijing University of Posts and Telecommunications - LeiLiBeijing University of Posts and Telecommunications + LeiLiBeijing University of Posts and Telecommunications QingYangDu Xiaoman Technology(Beijing) DongliangXuDu Xiaoman Technology(Beijing) 3880-3886 diff --git a/data/xml/2024.lrec.xml b/data/xml/2024.lrec.xml index 2b6c32c612..c116dfc772 100644 --- a/data/xml/2024.lrec.xml +++ b/data/xml/2024.lrec.xml @@ -9082,7 +9082,7 @@ QingYang DongliangXu YanquanZhou - LeiLi + LeiLi YuzeLi YingqiZhu 8792–8803 diff --git a/data/xml/K19.xml b/data/xml/K19.xml index a909084b16..dc6a3cf72c 100644 --- a/data/xml/K19.xml +++ b/data/xml/K19.xml @@ -955,7 +955,7 @@ In Conclusion Not Repetition: Comprehensive Abstractive Summarization with Diversified Attention Based on Determinantal Point Processes - LeiLi + LeiLi WeiLiu MarinaLitvak NataliaVanetik diff --git a/data/xml/W13.xml b/data/xml/W13.xml index 351599ba29..910d016091 100644 --- a/data/xml/W13.xml +++ b/data/xml/W13.xml @@ -5056,7 +5056,7 @@ <fixed-case>CIST</fixed-case> System Report for <fixed-case>ACL</fixed-case> <fixed-case>M</fixed-case>ulti<fixed-case>L</fixed-case>ing 2013 – Track 1: Multilingual Multi-document Summarization - LeiLi + LeiLi WeiHeng JiaYu YuLiu diff --git a/data/xml/W16.xml b/data/xml/W16.xml index 33d4e950d9..944a6fe4c3 100644 --- a/data/xml/W16.xml +++ b/data/xml/W16.xml @@ -2289,7 +2289,7 @@ <fixed-case>CIST</fixed-case> System for <fixed-case>CL</fixed-case>-<fixed-case>S</fixed-case>ci<fixed-case>S</fixed-case>umm 2016 Shared Task - LeiLi + LeiLi LiyuanMao YazhaoZhang JunqiChi From 2a8b49d27f45ee5e726f496319a03f232979726b Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Fri, 7 Nov 2025 03:01:41 +0100 Subject: [PATCH 09/19] typo fix --- data/xml/P19.xml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/data/xml/P19.xml b/data/xml/P19.xml index 0e563d8546..f954e88bac 100644 --- a/data/xml/P19.xml +++ b/data/xml/P19.xml @@ -7853,7 +7853,7 @@ YunxuanXiao YanruQu HaoZhou - LeiLi + LeiLi WeinanZhang YongYu 6140–6150 From e00b1c71592bb2d420fcf62c107453e396766a02 Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Fri, 7 Nov 2025 04:33:08 +0100 Subject: [PATCH 10/19] add papers to more specific lei li based on affiliation and CVs/GS matching --- data/xml/2020.fnp.xml | 2 +- data/xml/2021.acl.xml | 2 +- data/xml/2021.emnlp.xml | 2 +- data/xml/2021.findings.xml | 2 +- data/xml/2021.naacl.xml | 4 ++-- data/xml/D19.xml | 2 +- data/xml/W13.xml | 2 +- data/xml/W14.xml | 2 +- data/xml/W17.xml | 2 +- data/xml/W19.xml | 2 +- 10 files changed, 11 insertions(+), 11 deletions(-) diff --git a/data/xml/2020.fnp.xml b/data/xml/2020.fnp.xml index 30cff5edd3..78b5a1ee7f 100644 --- a/data/xml/2020.fnp.xml +++ b/data/xml/2020.fnp.xml @@ -194,7 +194,7 @@ Extractive Financial Narrative Summarisation based on <fixed-case>DPP</fixed-case>s - LeiLi + LeiLi YafeiJiang YinanLiu 100–104 diff --git a/data/xml/2021.acl.xml b/data/xml/2021.acl.xml index a0b841b9de..5e40a51caf 100644 --- a/data/xml/2021.acl.xml +++ b/data/xml/2021.acl.xml @@ -11081,7 +11081,7 @@ The source code has been made available at \url{https://github.com/liam0949/DCLO Pre-training Methods for Neural Machine Translation MingxuanWang - LeiLi + LeiLi 21–25 This tutorial provides a comprehensive guide to make the most of 
pre-training for neural machine translation. Firstly, we will briefly introduce the background of NMT, pre-training methodology, and point out the main challenges when applying pre-training for NMT. Then we will focus on analysing the role of pre-training in enhancing the performance of NMT, how to design a better pre-training model for executing specific NMT tasks and how to better integrate the pre-trained model into NMT system. In each part, we will provide examples, discuss training techniques and analyse what is transferred when applying pre-training. 2021.acl-tutorials.4 diff --git a/data/xml/2021.emnlp.xml b/data/xml/2021.emnlp.xml index 587d87fdda..8165009dff 100644 --- a/data/xml/2021.emnlp.xml +++ b/data/xml/2021.emnlp.xml @@ -9717,7 +9717,7 @@ Text <fixed-case>A</fixed-case>uto<fixed-case>A</fixed-case>ugment: Learning Compositional Augmentation Policy for Text Classification ShuhuaiRen JinchaoZhang - LeiLi + LeiLi XuSun JieZhou 9029–9043 diff --git a/data/xml/2021.findings.xml b/data/xml/2021.findings.xml index 6dc9353b6c..809a2ccb92 100644 --- a/data/xml/2021.findings.xml +++ b/data/xml/2021.findings.xml @@ -6725,7 +6725,7 @@ Leveraging Word-Formation Knowledge for <fixed-case>C</fixed-case>hinese Word Sense Disambiguation HuaZheng - LeiLi + LeiLi DamaiDai DeliChen TianyuLiu diff --git a/data/xml/2021.naacl.xml b/data/xml/2021.naacl.xml index 08ce6ff0e0..c896712ba5 100644 --- a/data/xml/2021.naacl.xml +++ b/data/xml/2021.naacl.xml @@ -2243,7 +2243,7 @@ Be Careful about Poisoned Word Embeddings: Exploring the Vulnerability of the Embedding Layers in <fixed-case>NLP</fixed-case> Models WenkaiYang - LeiLi + LeiLi ZhiyuanZhang XuanchengRen XuSun @@ -5884,7 +5884,7 @@ Decompose, Fuse and Generate: A Formation-Informed Method for <fixed-case>C</fixed-case>hinese Definition Generation HuaZheng DamaiDai - LeiLi + LeiLi TianyuLiu ZhifangSui BaobaoChang diff --git a/data/xml/D19.xml b/data/xml/D19.xml index 75635449b7..4b3cf71bd4 100644 --- a/data/xml/D19.xml +++ b/data/xml/D19.xml @@ -8707,7 +8707,7 @@ The tutorial will bring researchers and practitioners to be aware of this issue, Discreteness in Neural Natural Language Processing LiliMou HaoZhou - LeiLi + LeiLi This tutorial provides a comprehensive guide to the process of discreteness in neural NLP. As a gentle start, we will briefly introduce the background of deep learning based NLP, where we point out the ubiquitous discreteness of natural language and its challenges in neural information processing. Particularly, we will focus on how such discreteness plays a role in the input space, the latent space, and the output space of a neural network. In each part, we will provide examples, discuss machine learning techniques, as well as demonstrate NLP applications. 
diff --git a/data/xml/W13.xml b/data/xml/W13.xml index 910d016091..227482dfaf 100644 --- a/data/xml/W13.xml +++ b/data/xml/W13.xml @@ -5020,7 +5020,7 @@ Multi-document multilingual summarization corpus preparation, Part 1: <fixed-case>A</fixed-case>rabic, <fixed-case>E</fixed-case>nglish, <fixed-case>G</fixed-case>reek, <fixed-case>C</fixed-case>hinese, <fixed-case>R</fixed-case>omanian - LeiLi + LeiLi CorinaForascu MahmoudEl-Haj GeorgeGiannakopoulos diff --git a/data/xml/W14.xml b/data/xml/W14.xml index 9cdb41c81d..3fe049893c 100644 --- a/data/xml/W14.xml +++ b/data/xml/W14.xml @@ -11786,7 +11786,7 @@ XiaoyueCong FangHuang HongfaXue - LeiLi + LeiLi ZhiqiaoGao 114–119 W14-6818 diff --git a/data/xml/W17.xml b/data/xml/W17.xml index 4e65bc6b2b..20942f770b 100644 --- a/data/xml/W17.xml +++ b/data/xml/W17.xml @@ -1679,7 +1679,7 @@ Word Embedding and Topic Modeling Enhanced Multiple Features for Content Linking and Argument / Sentiment Labeling in Online Forums - LeiLi + LeiLi LiyuanMao MoyeChen 32–36 diff --git a/data/xml/W19.xml b/data/xml/W19.xml index 0df0123831..518a273da1 100644 --- a/data/xml/W19.xml +++ b/data/xml/W19.xml @@ -18512,7 +18512,7 @@ In this tutorial on MT and post-editing we would like to continue sharing the la Multi-lingual <fixed-case>W</fixed-case>ikipedia Summarization and Title Generation On Low Resource Corpus WeiLiu - LeiLi + LeiLi ZuyingHuang YinanLiu 17–25 From d3b6b0b69b420cb2bece3c800afdb23094cf9cc6 Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Fri, 7 Nov 2025 04:34:12 +0100 Subject: [PATCH 11/19] adding new `lei-li-zju` --- data/yaml/name_variants.yaml | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/data/yaml/name_variants.yaml b/data/yaml/name_variants.yaml index 7ac2003d36..9c1838889b 100644 --- a/data/yaml/name_variants.yaml +++ b/data/yaml/name_variants.yaml @@ -5756,6 +5756,11 @@ orcid: 0000-0002-3204-6527 comment: Beijing University of Posts and Telecommunications institution: Beijing University of Posts and Telecommunications +- canonical: {first: Lei, last: Li} + id: lei-li-zju + orcid: 0000-0002-7456-2204 + comment: Zhejiang University + institution: Zhejiang University - canonical: {first: Shih-Min, last: Li} variants: - {first: Shi-Min, last: Li} From 9d573559c409b334076ecd584d2c290fbc93d981 Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Fri, 7 Nov 2025 04:48:26 +0100 Subject: [PATCH 12/19] adding papers to new `lei-li-zju` based on affiliation displayed, comparison with openreview and g scholar --- data/xml/2022.acl.xml | 2 +- data/xml/2022.coling.xml | 2 +- data/xml/2022.emnlp.xml | 2 +- data/xml/2022.findings.xml | 2 +- data/xml/2023.ijcnlp.xml | 2 +- data/xml/2024.acl.xml | 2 +- data/xml/2024.findings.xml | 2 +- data/xml/2025.acl.xml | 2 +- 8 files changed, 8 insertions(+), 8 deletions(-) diff --git a/data/xml/2022.acl.xml b/data/xml/2022.acl.xml index 72e6ef489f..aa6e7d6894 100644 --- a/data/xml/2022.acl.xml +++ b/data/xml/2022.acl.xml @@ -7423,7 +7423,7 @@ in the Case of Unambiguous Gender MoshaChen ZhenBi XiaozhuanLiang - LeiLi + LeiLi XinShang KangpingYin ChuanqiTan diff --git a/data/xml/2022.coling.xml b/data/xml/2022.coling.xml index bfdedc0130..7c277651a0 100644 --- a/data/xml/2022.coling.xml +++ b/data/xml/2022.coling.xml @@ -2431,7 +2431,7 @@ <fixed-case>L</fixed-case>ight<fixed-case>NER</fixed-case>: A Lightweight Tuning Paradigm for Low-resource <fixed-case>NER</fixed-case> via Pluggable Prompting XiangChen - LeiLi + LeiLi ShuminDeng 
ChuanqiTan ChangliangXu diff --git a/data/xml/2022.emnlp.xml b/data/xml/2022.emnlp.xml index 7517e92f00..903a6ec7d6 100644 --- a/data/xml/2022.emnlp.xml +++ b/data/xml/2022.emnlp.xml @@ -11575,7 +11575,7 @@ XinXieZhejiang University XiangChenZhejiang University ZhouboLiZhejiang University - LeiLiZhejiang University + LeiLiZhejiang University 98-108 We present an open-source and extensible knowledge extraction toolkit DeepKE, supporting complicated low-resource, document-level and multimodal scenarios in the knowledge base population. DeepKE implements various information extraction tasks, including named entity recognition, relation extraction and attribute extraction. With a unified framework, DeepKE allows developers and researchers to customize datasets and models to extract information from unstructured data according to their requirements. Specifically, DeepKE not only provides various functional modules and model implementation for different tasks and scenarios but also organizes all components by consistent frameworks to maintain sufficient modularity and extensibility. We release the source code at GitHub in https://github.com/zjunlp/DeepKE with Google Colab tutorials and comprehensive documents for beginners. Besides, we present an online system in http://deepke.openkg.cn/EN/re_doc_show.html for real-time extraction of various tasks, and a demo video. 2022.emnlp-demos.10 diff --git a/data/xml/2022.findings.xml b/data/xml/2022.findings.xml index 25af1088c6..18f3de968a 100644 --- a/data/xml/2022.findings.xml +++ b/data/xml/2022.findings.xml @@ -6196,7 +6196,7 @@ Good Visual Guidance Make A Better Extractor: Hierarchical Visual Prefix for Multimodal Entity and Relation Extraction XiangChen NingyuZhang - LeiLi + LeiLi YunzhiYao ShuminDeng ChuanqiTan diff --git a/data/xml/2023.ijcnlp.xml b/data/xml/2023.ijcnlp.xml index 292a8d1274..a9c9103d62 100644 --- a/data/xml/2023.ijcnlp.xml +++ b/data/xml/2023.ijcnlp.xml @@ -1496,7 +1496,7 @@ PengfeiZhu ChaoPang YekunChai - LeiLi + LeiLi ShuohuanWang YuSun HaoTian diff --git a/data/xml/2024.acl.xml b/data/xml/2024.acl.xml index 66a5ff717f..5961854d68 100644 --- a/data/xml/2024.acl.xml +++ b/data/xml/2024.acl.xml @@ -13381,7 +13381,7 @@ ZiwenXuZhejiang University ShuofeiQiao RunnanFang - LeiLiTencent + LeiLiTencent ZhenBiZhejiang University GuozhouZheng HuajunChenZhejiang University diff --git a/data/xml/2024.findings.xml b/data/xml/2024.findings.xml index bd20b55e17..a46865543d 100644 --- a/data/xml/2024.findings.xml +++ b/data/xml/2024.findings.xml @@ -32433,7 +32433,7 @@ hai-coaching/ <fixed-case>H</fixed-case>yper<fixed-case>L</fixed-case>o<fixed-case>RA</fixed-case>: Efficient Cross-task Generalization via Constrained Low-Rank Adapters Generation ChuanchengLvTsinghua University, Tsinghua University - LeiLiTencent + LeiLiTencent ShitouZhang GangChen FanchaoQi diff --git a/data/xml/2025.acl.xml b/data/xml/2025.acl.xml index f8b0c3ebc7..996fc761d3 100644 --- a/data/xml/2025.acl.xml +++ b/data/xml/2025.acl.xml @@ -17060,7 +17060,7 @@ Uncertainty-Aware Iterative Preference Optimization for Enhanced <fixed-case>LLM</fixed-case> Reasoning - LeiLiTencent + LeiLiTencent HehuanLiu YaxinZhou ZhaoYangGuiTencent From e42139e0c5606b07392af4a8fee21dc4f98b2305 Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Fri, 7 Nov 2025 04:58:07 +0100 Subject: [PATCH 13/19] add new `lei-li-hkbu` Lei_Li19 on OR --- data/yaml/name_variants.yaml | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/data/yaml/name_variants.yaml 
b/data/yaml/name_variants.yaml index 9c1838889b..2cf5889c04 100644 --- a/data/yaml/name_variants.yaml +++ b/data/yaml/name_variants.yaml @@ -5751,6 +5751,11 @@ orcid: 0009-0008-6984-5104 comment: University of Hong Kong institution: University of Hong Kong +- canonical: {first: Lei, last: Li} + id: lei-li-hkbu + orcid: 0000-0002-5631-2519 + comment: Hong Kong Baptist University + institution: Hong Kong Baptist University - canonical: {first: Lei, last: Li} id: lei-li-bupt orcid: 0000-0002-3204-6527 From 0fb1bced1c584ef5dba5faf2de6e3fabf37273be Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Fri, 7 Nov 2025 04:58:41 +0100 Subject: [PATCH 14/19] add papers to new `lei-li-hkbu` using OpenReview and OpenReview --- data/xml/2021.acl.xml | 2 +- data/xml/2022.acl.xml | 2 +- data/xml/2022.coling.xml | 2 +- data/xml/2024.ccl.xml | 2 +- data/xml/2024.lrec.xml | 2 +- 5 files changed, 5 insertions(+), 5 deletions(-) diff --git a/data/xml/2021.acl.xml b/data/xml/2021.acl.xml index 5e40a51caf..5d70b7cf8c 100644 --- a/data/xml/2021.acl.xml +++ b/data/xml/2021.acl.xml @@ -5370,7 +5370,7 @@ The source code has been made available at \url{https://github.com/liam0949/DCLO Personalized Transformer for Explainable Recommendation - LeiLi + LeiLi YongfengZhang LiChen 4947–4957 diff --git a/data/xml/2022.acl.xml b/data/xml/2022.acl.xml index aa6e7d6894..985472c1c4 100644 --- a/data/xml/2022.acl.xml +++ b/data/xml/2022.acl.xml @@ -278,7 +278,7 @@ ShijieGeng ZuohuiFu YingqiangGe - LeiLi + LeiLi Gerardde Melo YongfengZhang 244-255 diff --git a/data/xml/2022.coling.xml b/data/xml/2022.coling.xml index 7c277651a0..83cca481e5 100644 --- a/data/xml/2022.coling.xml +++ b/data/xml/2022.coling.xml @@ -2759,7 +2759,7 @@ Augmenting Legal Judgment Prediction with Contrastive Case Relations DugangLiu WeihaoDu - LeiLi + LeiLi WeikePan ZhongMing 2658–2667 diff --git a/data/xml/2024.ccl.xml b/data/xml/2024.ccl.xml index 44aa040fb4..c505a9ce20 100644 --- a/data/xml/2024.ccl.xml +++ b/data/xml/2024.ccl.xml @@ -1070,7 +1070,7 @@ YuelouXu YanLu KaiWang - LeiLi + LeiLi YanquanZhou 1123–1135 “The zero-resource cross-domain named entity recognition (NER) task aims to perform NER in aspecific domain where labeled data is unavailable. Existing methods primarily focus on transfer-ring NER knowledge from high-resource to zero-resource domains. However, the challenge liesin effectively transferring NER knowledge between domains due to the inherent differences inentity structures across domains. To tackle this challenge, we propose an Unsupervised DomainAdaptation Adversarial (UDAA) framework, which combines the masked language model auxil-iary task with the domain adaptive adversarial network to mitigate inter-domain differences andefficiently facilitate knowledge transfer. Experimental results on CBS, Twitter, and WNUT2016three datasets demonstrate the effectiveness of our framework. Notably, we achieved new state-of-the-art performance on the three datasets. 
Our code will be released.Introduction” diff --git a/data/xml/2024.lrec.xml b/data/xml/2024.lrec.xml index c116dfc772..6a0ace7ce1 100644 --- a/data/xml/2024.lrec.xml +++ b/data/xml/2024.lrec.xml @@ -10424,7 +10424,7 @@ Large Language Models for Generative Recommendation: A Survey and Visionary Discussions - LeiLi + LeiLi YongfengZhang DugangLiu LiChen From 90492a02b05100e114fc8a4f22136a71d5304773 Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Fri, 7 Nov 2025 05:04:57 +0100 Subject: [PATCH 15/19] add new `lei-li-renmin` plus only paper OR Lei_Li42 --- data/xml/2025.findings.xml | 2 +- data/yaml/name_variants.yaml | 5 +++++ 2 files changed, 6 insertions(+), 1 deletion(-) diff --git a/data/xml/2025.findings.xml b/data/xml/2025.findings.xml index 7d74c6c282..49010d3c3c 100644 --- a/data/xml/2025.findings.xml +++ b/data/xml/2025.findings.xml @@ -43657,7 +43657,7 @@ <fixed-case>A</fixed-case>uto<fixed-case>MIR</fixed-case>: Effective Zero-Shot Medical Information Retrieval without Relevance Labels - LeiLi + LeiLi XiangxuZhangRenmin University of China XiaoZhou ZhengLiu diff --git a/data/yaml/name_variants.yaml b/data/yaml/name_variants.yaml index 2cf5889c04..2ff2f26a76 100644 --- a/data/yaml/name_variants.yaml +++ b/data/yaml/name_variants.yaml @@ -5766,6 +5766,11 @@ orcid: 0000-0002-7456-2204 comment: Zhejiang University institution: Zhejiang University +- canonical: {first: Lei, last: Li} + id: lei-li-renmin + orcid: 0000-0001-5660-0409 + comment: Renmin University + institution: Renmin University - canonical: {first: Shih-Min, last: Li} variants: - {first: Shi-Min, last: Li} From 78a5c6ec089f6ce61695e80c11d9d50a575903bb Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Fri, 7 Nov 2025 05:19:24 +0100 Subject: [PATCH 16/19] add new `lei-li-ecnu` plus papers OR Lei_Li29 , dblp.org/pid/13/7007-43 --- data/xml/2022.emnlp.xml | 2 +- data/xml/2022.findings.xml | 2 +- data/xml/2023.acl.xml | 2 +- data/yaml/name_variants.yaml | 5 +++++ 4 files changed, 8 insertions(+), 3 deletions(-) diff --git a/data/xml/2022.emnlp.xml b/data/xml/2022.emnlp.xml index 903a6ec7d6..5f6ea5d0bd 100644 --- a/data/xml/2022.emnlp.xml +++ b/data/xml/2022.emnlp.xml @@ -11465,7 +11465,7 @@ MinghuiQiuAlibaba Group TaolinZhangEast China Normal University TingtingLiuEast China Normal University - LeiLiEast China Normal University + LeiLiEast China Normal University JianingWangEast China Normal University MingWangAlibaba Group JunHuangAlibaba Group diff --git a/data/xml/2022.findings.xml b/data/xml/2022.findings.xml index 18f3de968a..8a4431f5dc 100644 --- a/data/xml/2022.findings.xml +++ b/data/xml/2022.findings.xml @@ -8908,7 +8908,7 @@ TingtingLiuEast China Normal University ChengyuWangAlibaba Group XiangruZhuFudan University - LeiLiEast China Normal University + LeiLiEast China Normal University MinghuiQiuAlibaba Group JunHuangalibaba group MingGaoEast China Normal University diff --git a/data/xml/2023.acl.xml b/data/xml/2023.acl.xml index 22590a6adf..2f960a6715 100644 --- a/data/xml/2023.acl.xml +++ b/data/xml/2023.acl.xml @@ -16901,7 +16901,7 @@ <fixed-case>F</fixed-case>ashion<fixed-case>KLIP</fixed-case>: Enhancing <fixed-case>E</fixed-case>-Commerce Image-Text Retrieval with Fashion Multi-Modal Conceptual Knowledge Graph XiaodanWangFudan University ChengyuWangAlibaba Group - LeiLiEast China Normal University + LeiLiEast China Normal University ZhixuLiFudan University BenChenAlibaba Group LinboJinAlibaba diff --git 
a/data/yaml/name_variants.yaml b/data/yaml/name_variants.yaml index 2ff2f26a76..83b0351cb3 100644 --- a/data/yaml/name_variants.yaml +++ b/data/yaml/name_variants.yaml @@ -5771,6 +5771,11 @@ orcid: 0000-0001-5660-0409 comment: Renmin University institution: Renmin University +- canonical: {first: Lei, last: Li} + id: lei-li-ecnu + orcid: 0000-0002-8891-1786 + comment: ECNU + institution: East China Normal University - canonical: {first: Shih-Min, last: Li} variants: - {first: Shi-Min, last: Li} From 573b6132b9715ae06e0714757481876acfac62e9 Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Fri, 7 Nov 2025 05:47:04 +0100 Subject: [PATCH 17/19] add new `lei-li-ucph` plus papers --- data/xml/2023.emnlp.xml | 2 +- data/xml/2023.findings.xml | 6 +++--- data/xml/2025.acl.xml | 2 +- data/xml/2025.findings.xml | 6 +++--- data/yaml/name_variants.yaml | 5 +++++ 5 files changed, 13 insertions(+), 8 deletions(-) diff --git a/data/xml/2023.emnlp.xml b/data/xml/2023.emnlp.xml index 1455cdd5b6..056292e4c9 100644 --- a/data/xml/2023.emnlp.xml +++ b/data/xml/2023.emnlp.xml @@ -4156,7 +4156,7 @@ Can We Edit Factual Knowledge by In-Context Learning? CeZheng - LeiLi + LeiLi QingxiuDong YuxuanFan ZhiyongWu diff --git a/data/xml/2023.findings.xml b/data/xml/2023.findings.xml index 08375137ea..99b00022b8 100644 --- a/data/xml/2023.findings.xml +++ b/data/xml/2023.findings.xml @@ -7044,7 +7044,7 @@ Communication Efficient Federated Learning for Multilingual Neural Machine Translation with Adapter YiLiuSchool of Computer Science, Peking University XiaohanBiPeking University - LeiLiPeking University + LeiLiPeking University SishuoChenCenter for Data Science, Peking University WenkaiYangPeking University XuSunPeking University @@ -10714,7 +10714,7 @@ Delving into the Openness of <fixed-case>CLIP</fixed-case> ShuhuaiRenPeking University - LeiLiPeking University + LeiLiPeking University XuanchengRenDAMO Academy, Alibaba Group GuangxiangZhaoShanghai AI lab XuSunPeking University @@ -16398,7 +16398,7 @@ <fixed-case>I</fixed-case>mage<fixed-case>N</fixed-case>et<fixed-case>VC</fixed-case>: Zero- and Few-Shot Visual Commonsense Evaluation on 1000 <fixed-case>I</fixed-case>mage<fixed-case>N</fixed-case>et Categories HemingXia QingxiuDong - LeiLi + LeiLi JingjingXu TianyuLiu ZiweiQin diff --git a/data/xml/2025.acl.xml b/data/xml/2025.acl.xml index 996fc761d3..f0faf01d79 100644 --- a/data/xml/2025.acl.xml +++ b/data/xml/2025.acl.xml @@ -11968,7 +11968,7 @@ TianfangZhangTsinghua University ZongkaiWu Jenq-NengHwang - LeiLi + LeiLi 16780-16790 Large Language Models (LLMs) have demonstrated impressive capabilities in reasoning tasks, yet their reliance on static prompt structures and limited adaptability to complex scenarios remains a major challenge. In this paper, we propose the **Deductive and Inductive (DID)** method, a novel framework that enhances LLM reasoning by dynamically integrating both deductive and inductive reasoning approaches. Drawing from cognitive science principles, DID implements a dual-metric complexity evaluation system that combines Littlestone dimension and information entropy to precisely assess task difficulty and guide decomposition strategies. DID enables the model to progressively adapt its reasoning pathways based on problem complexity, mirroring human cognitive processes. We evaluate DID’s effectiveness across multiple benchmarks, including the AIW, MR-GSM8K, and our custom Holiday Puzzle dataset for temporal reasoning. 
Our results demonstrate great improvements in reasoning quality and solution accuracy - achieving 70.3% accuracy on AIW (compared to 62.2% for Tree of Thought), while maintaining lower computational costs. 2025.acl-long.820 diff --git a/data/xml/2025.findings.xml b/data/xml/2025.findings.xml index 49010d3c3c..d6309fe740 100644 --- a/data/xml/2025.findings.xml +++ b/data/xml/2025.findings.xml @@ -13785,7 +13785,7 @@ ZongkaiWu JohnLeeUniversity of Edinburgh, University of Edinburgh Jenq-NengHwang - LeiLi + LeiLi 10045-10056 In the rapidly evolving field of image generation, achieving precise control over generated content and maintaining semantic consistency remain significant limitations, particularly concerning grounding techniques and the necessity for model fine-tuning. To address these challenges, we propose BayesGenie, an off-the-shelf approach that integrates Large Language Models (LLMs) with Bayesian Optimization to facilitate precise and user-friendly image editing. Our method enables users to modify images through natural language descriptions without manual area marking, while preserving the original image’s semantic integrity. Unlike existing techniques that require extensive pre-training or fine-tuning, our approach demonstrates remarkable adaptability across various LLMs through its model-agnostic design. BayesGenie employs an adapted Bayesian optimization strategy to automatically refine the inference process parameters, achieving high-precision image editing with minimal user intervention. Through extensive experiments across diverse scenarios, we demonstrate that our framework outperforms existing methods in both editing accuracy and semantic preservation, as validated using different LLMs including Claude3 and GPT-4. 2025.findings-acl.523 @@ -27104,7 +27104,7 @@ JinyuanXu XueHe Jenq-NengHwang - LeiLi + LeiLi 1736-1750 Understanding the decision-making processes of large language models (LLMs) is essential for their trustworthy development and deployment, however, current interpretability methods often face challenges such as low resolution and high computational cost. To address these limitations, we propose the Multi-Layer Attention Consistency Score (MACS), a novel, lightweight, and easily deployable heuristic for estimating the importance of input tokens in decoder-based models. MACS measures contributions of input tokens based on the consistency of maximal attention. Empirical evaluations demonstrate that MACS achieves a favorable trade-off between interpretability quality and computational efficiency, showing faithfulness comparable to complex techniques with a 22% decrease in VRAM usage and 30% reduction in latency. 2025.findings-emnlp.91 @@ -28380,7 +28380,7 @@ XinglinZhangMedical Image Insights TaoChenUniversity of Waterloo Jenq-NengHwang - LeiLi + LeiLi 3456-3467 Contrast-enhanced 3D Medical imaging (e.g., CT, MRI) leverages phase sequences to uncover temporal dynamics vital for diagnosing tumors, lesions, and vascular issues. However, current retrieval models primarily focus on spatial features, neglecting phase-specific progression detailed in clinical reports. We present the **Phase-aware Memory Network (PAMN)**, a novel framework enhancing 3D medical image retrieval by fusing imaging phases with diagnostic text. PAMN creates rich radiological representations that enhance diagnostic accuracy by combining image details with clinical report context, rigorously tested on a novel phase-series dataset of 12,230 hospital CT scans. 
PAMN achieves an effective balance of performance and scalability in 3D radiology retrieval, outperforming state-of-the-art baselines through the robust fusion of spatial, temporal, and textual information. 2025.findings-emnlp.184 diff --git a/data/yaml/name_variants.yaml b/data/yaml/name_variants.yaml index 83b0351cb3..6ca575802e 100644 --- a/data/yaml/name_variants.yaml +++ b/data/yaml/name_variants.yaml @@ -5776,6 +5776,11 @@ orcid: 0000-0002-8891-1786 comment: ECNU institution: East China Normal University +- canonical: {first: Lei, last: Li} + id: lei-li-ucph + orcid: 0000-0002-2929-0828 + comment: University of Copenhagen + institution: University of Copenhagen - canonical: {first: Shih-Min, last: Li} variants: - {first: Shi-Min, last: Li} From 5f19668fbc1e4db547aff1aa360120849b2ea677 Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Fri, 7 Nov 2025 06:00:26 +0100 Subject: [PATCH 18/19] forgot 1 letter --- data/xml/2025.acl.xml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/data/xml/2025.acl.xml b/data/xml/2025.acl.xml index f0faf01d79..b6c5557d7a 100644 --- a/data/xml/2025.acl.xml +++ b/data/xml/2025.acl.xml @@ -11968,7 +11968,7 @@ TianfangZhangTsinghua University ZongkaiWu Jenq-NengHwang - LeiLi + LeiLi 16780-16790 Large Language Models (LLMs) have demonstrated impressive capabilities in reasoning tasks, yet their reliance on static prompt structures and limited adaptability to complex scenarios remains a major challenge. In this paper, we propose the **Deductive and Inductive (DID)** method, a novel framework that enhances LLM reasoning by dynamically integrating both deductive and inductive reasoning approaches. Drawing from cognitive science principles, DID implements a dual-metric complexity evaluation system that combines Littlestone dimension and information entropy to precisely assess task difficulty and guide decomposition strategies. DID enables the model to progressively adapt its reasoning pathways based on problem complexity, mirroring human cognitive processes. We evaluate DID’s effectiveness across multiple benchmarks, including the AIW, MR-GSM8K, and our custom Holiday Puzzle dataset for temporal reasoning. Our results demonstrate great improvements in reasoning quality and solution accuracy - achieving 70.3% accuracy on AIW (compared to 62.2% for Tree of Thought), while maintaining lower computational costs. 2025.acl-long.820 From edb7a0155ce94b1b28f9bf02e6fb0d3555dec9cb Mon Sep 17 00:00:00 2001 From: weissenh <50957092+weissenh@users.noreply.github.com> Date: Fri, 7 Nov 2025 06:00:26 +0100 Subject: [PATCH 19/19] forgot 1 letter --- data/xml/2025.acl.xml | 2 +- data/xml/2025.findings.xml | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/data/xml/2025.acl.xml b/data/xml/2025.acl.xml index f0faf01d79..b6c5557d7a 100644 --- a/data/xml/2025.acl.xml +++ b/data/xml/2025.acl.xml @@ -11968,7 +11968,7 @@ TianfangZhangTsinghua University ZongkaiWu Jenq-NengHwang - LeiLi + LeiLi 16780-16790 Large Language Models (LLMs) have demonstrated impressive capabilities in reasoning tasks, yet their reliance on static prompt structures and limited adaptability to complex scenarios remains a major challenge. In this paper, we propose the **Deductive and Inductive (DID)** method, a novel framework that enhances LLM reasoning by dynamically integrating both deductive and inductive reasoning approaches. 
Drawing from cognitive science principles, DID implements a dual-metric complexity evaluation system that combines Littlestone dimension and information entropy to precisely assess task difficulty and guide decomposition strategies. DID enables the model to progressively adapt its reasoning pathways based on problem complexity, mirroring human cognitive processes. We evaluate DID’s effectiveness across multiple benchmarks, including the AIW, MR-GSM8K, and our custom Holiday Puzzle dataset for temporal reasoning. Our results demonstrate great improvements in reasoning quality and solution accuracy - achieving 70.3% accuracy on AIW (compared to 62.2% for Tree of Thought), while maintaining lower computational costs. 2025.acl-long.820 diff --git a/data/xml/2025.findings.xml b/data/xml/2025.findings.xml index d6309fe740..0ba8e26440 100644 --- a/data/xml/2025.findings.xml +++ b/data/xml/2025.findings.xml @@ -27104,7 +27104,7 @@ JinyuanXu XueHe Jenq-NengHwang - LeiLi + LeiLi 1736-1750 Understanding the decision-making processes of large language models (LLMs) is essential for their trustworthy development and deployment, however, current interpretability methods often face challenges such as low resolution and high computational cost. To address these limitations, we propose the Multi-Layer Attention Consistency Score (MACS), a novel, lightweight, and easily deployable heuristic for estimating the importance of input tokens in decoder-based models. MACS measures contributions of input tokens based on the consistency of maximal attention. Empirical evaluations demonstrate that MACS achieves a favorable trade-off between interpretability quality and computational efficiency, showing faithfulness comparable to complex techniques with a 22% decrease in VRAM usage and 30% reduction in latency. 2025.findings-emnlp.91