Skip to content

Commit 0e4a168

Browse files
authored
Add camembert model (#1034)
1 parent cefcadf commit 0e4a168

File tree

8 files changed: 2028 additions (+2028) and 0 deletions (-0).

mindone/transformers/__init__.py

Lines changed: 10 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -120,6 +120,16 @@
120120
Blip2QFormerModel,
121121
Blip2VisionModel,
122122
)
123+
from .models.camembert import (
124+
CamembertForCausalLM,
125+
CamembertForMaskedLM,
126+
CamembertForMultipleChoice,
127+
CamembertForQuestionAnswering,
128+
CamembertForSequenceClassification,
129+
CamembertForTokenClassification,
130+
CamembertModel,
131+
CamembertPreTrainedModel,
132+
)
123133
from .models.chameleon import (
124134
ChameleonForConditionalGeneration,
125135
ChameleonModel,

mindone/transformers/models/__init__.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -28,6 +28,7 @@
2828
bit,
2929
blip,
3030
blip_2,
31+
camembert,
3132
clap,
3233
clip,
3334
dpt,

mindone/transformers/models/auto/configuration_auto.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -60,6 +60,7 @@
6060
("granitemoeshared", "GraniteMoeSharedConfig"),
6161
("helium", "HeliumConfig"),
6262
("hiera", "HieraConfig"),
63+
("camembert", "CamembertConfig"),
6364
("idefics", "IdeficsConfig"),
6465
("idefics2", "Idefics2Config"),
6566
("idefics3", "Idefics3Config"),
@@ -111,6 +112,7 @@
111112
("aria_text", "AriaText"),
112113
("bert", "BERT"),
113114
("bart", "BART"),
115+
("camembert", "CamemBERT"),
114116
("bit", "BiT"),
115117
("blip", "BLIP"),
116118
("blip-2", "BLIP-2"),

mindone/transformers/models/auto/modeling_auto.py

Lines changed: 9 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -37,6 +37,7 @@
3737
("aria_text", "AriaTextModel"),
3838
("bert", "BertModel"),
3939
("bart", "BartModel"),
40+
("camembert", "CamembertModel"),
4041
("bit", "BitModel"),
4142
("blip", "BlipModel"),
4243
("blip-2", "Blip2Model"),
@@ -106,6 +107,7 @@
106107
# Model for pre-training mapping
107108
("albert", "AlbertForPreTraining"),
108109
("bart", "BartForConditionalGeneration"),
110+
("camembert", "CamembertForMaskedLM"),
109111
("bert", "BertForPreTraining"),
110112
("gpt2", "GPT2LMHeadModel"),
111113
("gemma3", "Gemma3ForConditionalGeneration"),
@@ -137,6 +139,7 @@
137139
("deberta-v2", "DebertaV2ForMaskedLM"),
138140
("gpt2", "GPT2LMHeadModel"),
139141
("led", "LEDForConditionalGeneration"),
142+
("camembert", "CamembertForMaskedLM"),
140143
("roberta", "RobertaForMaskedLM"),
141144
("megatron-bert", "MegatronBertForCausalLM"),
142145
("mobilebert", "MobileBertForMaskedLM"),
@@ -155,6 +158,7 @@
155158
# Model for Causal LM mapping
156159
("aria_text", "AriaTextForCausalLM"),
157160
("bart", "BartForCausalLM"),
161+
("camembert", "CamembertForCausalLM"),
158162
("bert", "BertLMHeadModel"),
159163
("bert-generation", "BertGenerationDecoder"),
160164
("gemma", "GemmaForCausalLM"),
@@ -274,6 +278,7 @@
274278
("bart", "BartForConditionalGeneration"),
275279
("bert", "BertForMaskedLM"),
276280
("roberta", "RobertaForMaskedLM"),
281+
("camembert", "CamembertForMaskedLM"),
277282
("deberta", "DebertaForMaskedLM"),
278283
("deberta-v2", "DebertaV2ForMaskedLM"),
279284
("mobilebert", "MobileBertForMaskedLM"),
@@ -340,6 +345,7 @@
340345
# Model for Sequence Classification mapping
341346
("albert", "AlbertForSequenceClassification"),
342347
("bart", "BartForSequenceClassification"),
348+
("camembert", "CamembertForSequenceClassification"),
343349
("bert", "BertForSequenceClassification"),
344350
("roberta", "RobertaForSequenceClassification"),
345351
("deberta", "DebertaForSequenceClassification"),
@@ -373,6 +379,7 @@
373379
("albert", "AlbertForQuestionAnswering"),
374380
("bart", "BartForQuestionAnswering"),
375381
("bert", "BertForQuestionAnswering"),
382+
("camembert", "CamembertForQuestionAnswering"),
376383
("roberta", "RobertaForQuestionAnswering"),
377384
("deberta", "DebertaForQuestionAnswering"),
378385
("deberta-v2", "DebertaV2ForQuestionAnswering"),
@@ -407,6 +414,7 @@
407414
# Model for Token Classification mapping
408415
("albert", "AlbertForTokenClassification"),
409416
("bert", "BertForTokenClassification"),
417+
("camembert", "CamembertForTokenClassification"),
410418
("deberta", "DebertaForTokenClassification"),
411419
("deberta-v2", "DebertaV2ForTokenClassification"),
412420
("glm", "GlmForTokenClassification"),
@@ -433,6 +441,7 @@
433441
MODEL_FOR_MULTIPLE_CHOICE_MAPPING_NAMES = OrderedDict(
434442
[
435443
# Model for Multiple Choice mapping
444+
("camembert", "CamembertForMultipleChoice"),
436445
("albert", "AlbertForMultipleChoice"),
437446
("bert", "BertForMultipleChoice"),
438447
("roberta", "RobertaForMultipleChoice"),
mindone/transformers/models/camembert/__init__.py

Lines changed: 26 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,26 @@
1+
# Copyright 2024 The HuggingFace Team. All rights reserved.
2+
#
3+
# This code is adapted from https://github.com/huggingface/transformers
4+
# with modifications to run transformers on mindspore.
5+
#
6+
# Licensed under the Apache License, Version 2.0 (the "License");
7+
# you may not use this file except in compliance with the License.
8+
# You may obtain a copy of the License at
9+
#
10+
# http://www.apache.org/licenses/LICENSE-2.0
11+
#
12+
# Unless required by applicable law or agreed to in writing, software
13+
# distributed under the License is distributed on an "AS IS" BASIS,
14+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15+
# See the License for the specific language governing permissions and
16+
# limitations under the License.
17+
from .modeling_camembert import (
18+
CamembertForCausalLM,
19+
CamembertForMaskedLM,
20+
CamembertForMultipleChoice,
21+
CamembertForQuestionAnswering,
22+
CamembertForSequenceClassification,
23+
CamembertForTokenClassification,
24+
CamembertModel,
25+
CamembertPreTrainedModel,
26+
)

0 commit comments

Comments
 (0)