We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 030879f, commit ad06609 (Copy full SHA for ad06609)
torchtitan/models/moe.py
@@ -216,7 +216,7 @@ def forward(
216
elif self.score_func == "softmax":
217
scores = F.softmax(scores.to(torch.float32), dim=1)
218
else:
219
- raise NotImplementedError(f"Unknown score function {self.score_function}")
+ raise NotImplementedError(f"Unknown score function {self.score_func}")
220
221
# top scores shape (bs*slen, top_k)
222
# NOTE: The expert_bias is only used for routing. The gating value
0 commit comments