Skip to content

Commit 2bdbf2d

Browse files
committed
mask to bool for bloom fwd
1 parent c6db638 commit 2bdbf2d

File tree

1 file changed

+5
-1
lines changed

1 file changed

+5
-1
lines changed

src/petals/models/bloom/block.py

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -27,13 +27,17 @@ def forward(
2727
attention_mask = torch.ones((batch_size, seq_length_with_past), device=hidden_states.device)
2828
if alibi is None:
2929
alibi = build_alibi_tensor(attention_mask, num_heads=self.num_heads, dtype=hidden_states.dtype)
30-
fake_inputs_embeds = torch.tensor([42], dtype=torch.float32)
30+
31+
# _prepare_4d only needs inputs_embeds.dtype. And it is changed to bool before .forward() anyways
32+
fake_inputs_embeds = torch.tensor([42], dtype=torch.float32)
33+
3134
attention_mask = _prepare_4d_causal_attention_mask(
3235
attention_mask=attention_mask,
3336
input_shape=(batch_size, seq_length),
3437
inputs_embeds=fake_inputs_embeds,
3538
past_key_values_length=past_length,
3639
)
40+
attention_mask = attention_mask.bool() # consistent with https://github.com/huggingface/transformers/pull/27086
3741
return super().forward(
3842
hidden_states, *args, attention_mask=attention_mask, alibi=alibi, layer_past=layer_past, **kwargs
3943
)

0 commit comments

Comments (0)