File tree Expand file tree Collapse file tree 2 files changed +0
-2
lines changed Expand file tree Collapse file tree 2 files changed +0
-2
lines changed Original file line number Diff line number Diff line change @@ -270,7 +270,6 @@ def mistral_for_causal_lm_forward(
270
270
shift_labels = labels [..., 1 :].contiguous ()
271
271
# Flatten the tokens
272
272
loss_fct = CrossEntropyLoss ()
273
- #shift_logits = shift_logits.view(-1, self.config.vocab_size)
274
273
shift_labels = shift_labels .view (- 1 )
275
274
# Enable model parallelism
276
275
shift_labels = shift_labels .to (shift_logits .device )
Original file line number Diff line number Diff line change @@ -277,7 +277,6 @@ def module_policy(self):
277
277
suffix = "lm_head" ,
278
278
target_module = VocabParallelLMHead1D ,
279
279
kwargs = {
280
- #gather_output=True,
281
280
"gather_output" : not self .shard_config .parallel_output ,
282
281
"make_vocab_size_divisible_by" : self .shard_config .make_vocab_size_divisible_by ,
283
282
},
You can’t perform that action at this time.
0 commit comments