We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 7a4cc3e commit 5d01df8Copy full SHA for 5d01df8
tests/unit_tests/models/deepseek_v3/test_dsv3_layers.py
@@ -201,6 +201,7 @@ def create_mock_config(self, **overrides):
201
config.hidden_size = 4096
202
config.rope_scaling = None
203
config.max_position_embeddings = 4096
204
+ config.rms_norm_eps = 1e-6
205
206
# Apply overrides
207
for key, value in overrides.items():
@@ -358,6 +359,7 @@ def create_mock_config(self, **overrides):
358
359
config.hidden_size = 1024
360
361
362
363
364
365
setattr(config, key, value)
@@ -480,6 +482,7 @@ def create_mock_config(self, **overrides):
480
482
481
483
484
485
486
487
488
0 commit comments