
Commit f0b235c

Heuristics + testing unification + CUDA Graphs (#1306)
## 🚀 Pull Request Checklist

Thank you for contributing to FlashInfer! Before we review your pull request, please make sure the following items are complete.

### ✅ Pre-commit Checks

- [x] I have installed `pre-commit` by running `pip install pre-commit` (or used your preferred method).
- [x] I have installed the hooks with `pre-commit install`.
- [x] I have run the hooks manually with `pre-commit run --all-files` and fixed any reported issues.

> If you are unsure about how to set up `pre-commit`, see [the pre-commit documentation](https://pre-commit.com/).

## 🧪 Tests

- [x] Tests have been added or updated as needed.
- [x] All tests are passing (`unittest`, etc.).
1 parent 238f1d2

4 files changed (+1435, -1524 lines)

flashinfer/__init__.py

Lines changed: 1 addition & 0 deletions

@@ -117,3 +117,4 @@
 from .sampling import top_p_renorm_probs as top_p_renorm_probs
 from .sampling import top_p_sampling_from_probs as top_p_sampling_from_probs
 from .sparse import BlockSparseAttentionWrapper as BlockSparseAttentionWrapper
+from .utils import next_positive_power_of_2 as next_positive_power_of_2
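
This re-exports the new helper at the package top level. A minimal usage sketch (assuming a `flashinfer` build that includes this commit; the CUDA-graph bucketing use is inferred from the commit title, not stated in the diff):

```python
import flashinfer

# Round a size up to the next power of two, e.g. to pick a fixed set of
# batch-size buckets when replaying CUDA-graph-captured kernels
# (a plausible use given the commit title, not confirmed by the diff).
assert flashinfer.next_positive_power_of_2(1) == 1
assert flashinfer.next_positive_power_of_2(5) == 8
assert flashinfer.next_positive_power_of_2(1024) == 1024
assert flashinfer.next_positive_power_of_2(0) == 1  # inputs < 1 clamp to 1
```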

flashinfer/utils.py

Lines changed: 17 additions & 0 deletions

@@ -84,6 +84,23 @@ def _expand_4d(x: torch.Tensor, kv_layout: str) -> torch.Tensor:
     return x


+def next_positive_power_of_2(x: int) -> int:
+    if x < 1:
+        return 1
+
+    # The following is equivalent to 1 << (x - 1).bit_length(), but avoids
+    # bit_length() so that it stays traceable by torch.compile.
+    # It correctly handles 64-bit numbers, which should be enough for now.
+    n = x - 1
+    n |= n >> 1
+    n |= n >> 2
+    n |= n >> 4
+    n |= n >> 8
+    n |= n >> 16
+    n |= n >> 32
+    return n + 1
+
+
 def _check_pos_encoding_mode(pos_encoding_mode: str) -> None:
     if not hasattr(PosEncodingMode, pos_encoding_mode):
         raise KeyError("Invalid pos_encoding_mode {}".format(pos_encoding_mode))
