We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 4a69804, commit 653ad38 (Copy full SHA for 653ad38)
primus/configs/models/megatron/language_model.yaml
@@ -68,6 +68,7 @@ attention_softmax_in_fp32: false
68
# fusion
69
bias_gelu_fusion: true
70
cross_entropy_loss_fusion: False
71
+cross_entropy_fusion_impl: "native" # "native", "te"
72
bias_swiglu_fusion: true
73
masked_softmax_fusion: true
74
no_persist_layer_norm: false
0 commit comments