@@ -821,7 +821,7 @@ class ErniePretrainedModel(PretrainedModel):
821
821
"num_hidden_layers" : 12 ,
822
822
"task_type_vocab_size" : 3 ,
823
823
"type_vocab_size" : 4 ,
824
- "use_task_id" : True ,
824
+ "use_task_id" : False ,
825
825
"vocab_size" : 40000 ,
826
826
},
827
827
"ernie-3.0-tiny-medium-v2" : {
@@ -836,7 +836,7 @@ class ErniePretrainedModel(PretrainedModel):
836
836
"num_hidden_layers" : 6 ,
837
837
"task_type_vocab_size" : 16 ,
838
838
"type_vocab_size" : 4 ,
839
- "use_task_id" : True ,
839
+ "use_task_id" : False ,
840
840
"vocab_size" : 40000 ,
841
841
},
842
842
"ernie-3.0-tiny-mini-v2" : {
@@ -851,7 +851,7 @@ class ErniePretrainedModel(PretrainedModel):
851
851
"num_hidden_layers" : 6 ,
852
852
"task_type_vocab_size" : 16 ,
853
853
"type_vocab_size" : 4 ,
854
- "use_task_id" : True ,
854
+ "use_task_id" : False ,
855
855
"vocab_size" : 40000 ,
856
856
},
857
857
"ernie-3.0-tiny-micro-v2" : {
@@ -866,7 +866,7 @@ class ErniePretrainedModel(PretrainedModel):
866
866
"num_hidden_layers" : 4 ,
867
867
"task_type_vocab_size" : 16 ,
868
868
"type_vocab_size" : 4 ,
869
- "use_task_id" : True ,
869
+ "use_task_id" : False ,
870
870
"vocab_size" : 40000 ,
871
871
},
872
872
"ernie-3.0-tiny-nano-v2" : {
@@ -881,22 +881,22 @@ class ErniePretrainedModel(PretrainedModel):
881
881
"num_hidden_layers" : 4 ,
882
882
"task_type_vocab_size" : 16 ,
883
883
"type_vocab_size" : 4 ,
884
- "use_task_id" : True ,
884
+ "use_task_id" : False ,
885
885
"vocab_size" : 40000 ,
886
886
},
887
887
"ernie-3.0-tiny-pico-v2" : {
888
888
"attention_probs_dropout_prob" : 0.1 ,
889
889
"hidden_act" : "gelu" ,
890
890
"hidden_dropout_prob" : 0.1 ,
891
891
"hidden_size" : 128 ,
892
- "intermediate_size" : 1248 ,
892
+ "intermediate_size" : 512 ,
893
893
"initializer_range" : 0.02 ,
894
894
"max_position_embeddings" : 2048 ,
895
895
"num_attention_heads" : 2 ,
896
896
"num_hidden_layers" : 3 ,
897
897
"task_type_vocab_size" : 16 ,
898
898
"type_vocab_size" : 4 ,
899
- "use_task_id" : True ,
899
+ "use_task_id" : False ,
900
900
"vocab_size" : 40000 ,
901
901
},
902
902
}
0 commit comments