We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent a2deb0d commit 8fbabf8 — Copy full SHA for 8fbabf8
keras_hub/src/models/smollm3/smollm3_utils.py
@@ -38,6 +38,7 @@ def eager_attention_forward(
38
dropout=0.0,
39
training=False,
40
):
41
+ print('training', training)
42
key_states = repeat_kv(key, module.num_key_value_groups)
43
value_states = repeat_kv(value, module.num_key_value_groups)
44
0 commit comments