@@ -492,16 +492,19 @@ def update_and_add_testing_config(
492492 "qwen_2" ,
493493 # TODO: replace
494494 updates = {
495- ("model" , "base_model" , "decoder" , "block" , "add_linear_biases" ): "only_attn_qkv" ,
495+ ("model" , "base_model" , "decoder" , "block" , "mixer" , "query_layer" , "bias" , "enabled" ): True ,
496+ ("model" , "base_model" , "decoder" , "block" , "mixer" , "key_layer" , "bias" , "enabled" ): True ,
497+ ("model" , "base_model" , "decoder" , "block" , "mixer" , "value_layer" , "bias" , "enabled" ): True ,
498+ ("model" , "base_model" , "decoder" , "block" , "mixer" , "dense_layer" , "bias" , "enabled" ): False ,
496499 },
497500 # Megatron doesn't support per sub layer biases.
498501 megatron_args = None ,
499502 checkpoint_format = Qwen2CheckpointFormat ,
500503 # TODO: Add back generate as `normal` when stable.
501504 groups = {
502- ModelTestingGroup .basic : ModelTestingGroupAction .broken ,
503- ModelTestingGroup .checkpoint : ModelTestingGroupAction .broken ,
504- ModelTestingGroup .convert : ModelTestingGroupAction .broken ,
505+ ModelTestingGroup .basic : ModelTestingGroupAction .normal ,
506+ ModelTestingGroup .checkpoint : ModelTestingGroupAction .normal ,
507+ ModelTestingGroup .convert : ModelTestingGroupAction .normal ,
505508 ModelTestingGroup .generate : ModelTestingGroupAction .broken ,
506509 ModelTestingGroup .megatron : ModelTestingGroupAction .not_implemented ,
507510 ModelTestingGroup .distributed : ModelTestingGroupAction .unimportant ,
0 commit comments