Skip to content

Commit 05ad6a7

Browse files
authored
Rename Mixtral bridges to be in line with new naming scheme (#1057)
1 parent 5b4cfae commit 05ad6a7

File tree

1 file changed

+8
-8
lines changed
  • transformer_lens/model_bridge/supported_architectures

1 file changed

+8
-8
lines changed

transformer_lens/model_bridge/supported_architectures/mixtral.py

Lines changed: 8 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -89,22 +89,22 @@ def __init__(self, cfg: Any) -> None:
8989
name="self_attn",
9090
config=self.cfg,
9191
submodules={
92-
"W_Q": LinearBridge(name="q_proj"),
93-
"W_K": LinearBridge(name="k_proj"),
94-
"W_V": LinearBridge(name="v_proj"),
95-
"W_O": LinearBridge(name="o_proj"),
92+
"q": LinearBridge(name="q_proj"),
93+
"k": LinearBridge(name="k_proj"),
94+
"v": LinearBridge(name="v_proj"),
95+
"o": LinearBridge(name="o_proj"),
9696
},
9797
),
9898
"mlp": MoEBridge(
9999
name="block_sparse_moe",
100100
submodules={
101-
"W_gate": LinearBridge(name="gate"),
101+
"gate": LinearBridge(name="gate"),
102102
"experts": BlockBridge(
103103
name="experts",
104104
submodules={
105-
"W_gate": LinearBridge(name="w1"),
106-
"W_in": LinearBridge(name="w3"),
107-
"W_out": LinearBridge(name="w2"),
105+
"gate": LinearBridge(name="w1"),
106+
"in": LinearBridge(name="w3"),
107+
"out": LinearBridge(name="w2"),
108108
},
109109
),
110110
},

0 commit comments

Comments
 (0)