Skip to content

Commit 46cbe60

Browse files
smallv0221 and tianxin authored
Add finetuned ernie gram (#1814)
* add finetuned ernie-gram model * add finetuned ernie-gram model Co-authored-by: tianxin <[email protected]>
1 parent 0a29889 commit 46cbe60

File tree

3 files changed

+30
-1
lines changed

3 files changed

+30
-1
lines changed

docs/model_zoo/transformers.rst

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -329,6 +329,11 @@ Transformer预训练模型汇总
329329
|ERNIE-GRAM_ |``ernie-gram-zh`` | Chinese | 12-layer, 768-hidden, |
330330
| | | | 12-heads, 108M parameters. |
331331
| | | | Trained on Chinese text. |
332+
+ +----------------------------------------------------------------------------------+--------------+-----------------------------------------+
333+
| |``ernie-gram-zh-finetuned-dureader-robust`` | Chinese | 12-layer, 768-hidden, |
334+
| | | | 12-heads, 108M parameters. |
335+
| | | | Trained on Chinese text. |
336+
| | | | Then finetuned on dureader-robust |
332337
+--------------------+----------------------------------------------------------------------------------+--------------+-----------------------------------------+
333338
|GPT_ |``gpt-cpm-large-cn`` | Chinese | 32-layer, 2560-hidden, |
334339
| | | | 32-heads, 2.6B parameters. |

paddlenlp/transformers/ernie_gram/modeling.py

Lines changed: 15 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -98,12 +98,27 @@ class ErnieGramPretrainedModel(PretrainedModel):
9898
"type_vocab_size": 2,
9999
"vocab_size": 18018
100100
},
101+
"ernie-gram-zh-finetuned-dureader-robust": {
102+
"attention_probs_dropout_prob": 0.1,
103+
"emb_size": 768,
104+
"hidden_act": "gelu",
105+
"hidden_dropout_prob": 0.1,
106+
"hidden_size": 768,
107+
"initializer_range": 0.02,
108+
"max_position_embeddings": 512,
109+
"num_attention_heads": 12,
110+
"num_hidden_layers": 12,
111+
"type_vocab_size": 2,
112+
"vocab_size": 18018
113+
},
101114
}
102115
resource_files_names = {"model_state": "model_state.pdparams"}
103116
pretrained_resource_files_map = {
104117
"model_state": {
105118
"ernie-gram-zh":
106119
"https://bj.bcebos.com/paddlenlp/models/transformers/ernie_gram_zh/ernie_gram_zh.pdparams",
120+
"ernie-gram-zh-finetuned-dureader-robust":
121+
"https://bj.bcebos.com/paddlenlp/models/transformers/ernie-gram-zh-finetuned-dureader-robust/model_state.pdparams",
107122
},
108123
}
109124
base_model_prefix = "ernie_gram"

paddlenlp/transformers/ernie_gram/tokenizer.py

Lines changed: 10 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -77,9 +77,18 @@ class ErnieGramTokenizer(ErnieTokenizer):
7777
"vocab_file": {
7878
"ernie-gram-zh":
7979
"https://bj.bcebos.com/paddlenlp/models/transformers/ernie_gram_zh/vocab.txt",
80+
"ernie-gram-zh-finetuned-dureader-robust":
81+
"https://bj.bcebos.com/paddlenlp/models/transformers/ernie_gram_zh/vocab.txt",
8082
}
8183
}
82-
pretrained_init_configuration = {"ernie-gram-zh": {"do_lower_case": True}, }
84+
pretrained_init_configuration = {
85+
"ernie-gram-zh": {
86+
"do_lower_case": True
87+
},
88+
"ernie-gram-zh-finetuned-dureader-robust": {
89+
"do_lower_case": True
90+
},
91+
}
8392

8493
def __init__(self,
8594
vocab_file,

0 commit comments

Comments
 (0)