We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 72dc153 · commit ba1cc7b · Copy full SHA for ba1cc7b
paddlenlp/transformers/deepseek_v2/modeling.py
@@ -2354,7 +2354,7 @@ def __init__(
2354
2355
self.enorm = DeepseekV2RMSNorm(config)
2356
self.hnorm = DeepseekV2RMSNorm(config)
2357
- self.eh_proj = nn.Linear(2 * config.hidden_size, config.hidden_size)
+ self.eh_proj = nn.Linear(2 * config.hidden_size, config.hidden_size, bias_attr=False)
2358
2359
def forward(
2360
self,
0 commit comments