We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 5be137b commit c45f589 Copy full SHA for c45f589
keras_hub/src/models/smollm3/smollm3_utils.py
@@ -47,6 +47,7 @@ def eager_attention_forward(
47
)
48
49
# Apply attention mask if provided
50
+ print("attention_mask", attention_mask)
51
if attention_mask is not None:
52
causal_mask = attention_mask[:, :, :, : ops.shape(key_states)[-2]]
53
attn_weights = ops.add(attn_weights, causal_mask)
0 commit comments