Skip to content

Commit 61bab95

Browse files
committed
update gru
Signed-off-by: Mayank Mishra <mayank31398@gmail.com>
1 parent 6e1bb32 commit 61bab95

File tree

2 files changed: 0 additions (+0), 2 deletions (-2)
  • lm_engine/hf_models/modeling_utils/sequence_mixer_blocks

2 files changed: 0 additions (+0), 2 deletions (-2)

lm_engine/hf_models/modeling_utils/sequence_mixer_blocks/gru.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -132,7 +132,6 @@ def __init__(
old  new
132  132
133  133    self.norm = get_normalization_function(normalization_function, self.state_size)
134  134
135       - mark_parameter_as_mup_learning_rate(self.conv1d.weight)
136  135    mark_parameter_as_mup_learning_rate(self.input_projection.weight)
137  136    mark_parameter_as_mup_learning_rate(self.state_weight)
138  137    mark_parameter_as_mup_learning_rate(self.output_projection.weight)

lm_engine/hf_models/modeling_utils/sequence_mixer_blocks/rnn.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -101,7 +101,6 @@ def __init__(
old  new
101  101
102  102    self.norm = get_normalization_function(normalization_function, self.state_size)
103  103
104       - mark_parameter_as_mup_learning_rate(self.conv1d.weight)
105  104    mark_parameter_as_mup_learning_rate(self.input_projection.weight)
106  105    mark_parameter_as_mup_learning_rate(self.state_weight)
107  106    mark_parameter_as_mup_learning_rate(self.output_projection.weight)

0 commit comments

Comments
 (0)