Skip to content

Commit 126f42d

Browse files
authored
Fix for the qwen test config (#437)
1 parent 4ee9713 commit 126f42d

File tree

1 file changed

+7 -4 lines changed

1 file changed

+7 -4 lines changed

tests/utils/model_configs.py

Lines changed: 7 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -492,16 +492,19 @@ def update_and_add_testing_config(
492 492       "qwen_2",
493 493       # TODO: replace
494 494       updates={
495     -         ("model", "base_model", "decoder", "block", "add_linear_biases"): "only_attn_qkv",
    495 +         ("model", "base_model", "decoder", "block", "mixer", "query_layer", "bias", "enabled"): True,
    496 +         ("model", "base_model", "decoder", "block", "mixer", "key_layer", "bias", "enabled"): True,
    497 +         ("model", "base_model", "decoder", "block", "mixer", "value_layer", "bias", "enabled"): True,
    498 +         ("model", "base_model", "decoder", "block", "mixer", "dense_layer", "bias", "enabled"): False,
496 499       },
497 500       # Megatron doesn't support per sub layer biases.
498 501       megatron_args=None,
499 502       checkpoint_format=Qwen2CheckpointFormat,
500 503       # TODO: Add back generate as `normal` when stable.
501 504       groups={
502     -         ModelTestingGroup.basic: ModelTestingGroupAction.broken,
503     -         ModelTestingGroup.checkpoint: ModelTestingGroupAction.broken,
504     -         ModelTestingGroup.convert: ModelTestingGroupAction.broken,
    505 +         ModelTestingGroup.basic: ModelTestingGroupAction.normal,
    506 +         ModelTestingGroup.checkpoint: ModelTestingGroupAction.normal,
    507 +         ModelTestingGroup.convert: ModelTestingGroupAction.normal,
505 508           ModelTestingGroup.generate: ModelTestingGroupAction.broken,
506 509           ModelTestingGroup.megatron: ModelTestingGroupAction.not_implemented,
507 510           ModelTestingGroup.distributed: ModelTestingGroupAction.unimportant,

0 commit comments

Comments (0)